From 7b668d0e1923bad2437afad1ba6996f7200468a1 Mon Sep 17 00:00:00 2001
From: tykoo-chen
Date: Wed, 11 Mar 2026 18:53:18 +0000
Subject: [PATCH] feat: print startup_time in final summary

startup_time is already calculated but not printed. Adding it to the
output helps understand compilation overhead and total experiment time.
---
 train.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/train.py b/train.py
index 2e743974..7b46cb66 100644
--- a/train.py
+++ b/train.py
@@ -628,3 +628,4 @@ def get_weight_decay(progress):
 print(f"num_steps: {step}")
 print(f"num_params_M: {num_params / 1e6:.1f}")
 print(f"depth: {DEPTH}")
+print(f"startup_seconds: {startup_time:.1f}")