diff --git a/train.py b/train.py
index 2e743974..7b46cb66 100644
--- a/train.py
+++ b/train.py
@@ -628,3 +628,4 @@ def get_weight_decay(progress):
 print(f"num_steps: {step}")
 print(f"num_params_M: {num_params / 1e6:.1f}")
 print(f"depth: {DEPTH}")
+print(f"startup_seconds: {startup_time:.1f}")