-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathmonitor_training.sh
More file actions
29 lines (24 loc) · 884 Bytes
/
monitor_training.sh
File metadata and controls
29 lines (24 loc) · 884 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash
# monitor_training.sh
# Monitor and check status of training jobs.
#
# Prints, in order:
#   1. running processes whose command line contains "train_overnight"
#   2. the five most recently modified logs/training_*.log (oldest first)
#   3. the five most recently modified checkpoints/model_*.pth (oldest first)
#   4. the last 50 lines of the newest training log
# All paths are relative to the current working directory.

#######################################
# Long-list the (up to) five most recently modified of the given files,
# oldest first, or print a fallback message when none of them exist.
# Arguments:
#   $1   - message to print when no file exists
#   $2.. - candidate paths (typically an unquoted glob at the call site; an
#          unmatched glob arrives as the literal pattern and is filtered out)
# Outputs: listing or fallback message on stdout
#######################################
list_recent() {
  local empty_msg=$1
  shift
  local -a existing=()
  local path
  for path in "$@"; do
    [[ -e "$path" ]] && existing+=("$path")
  done

  # Decide on the fallback here rather than with `ls | tail || echo`: the
  # status of that pipeline is tail's, which is 0 even for empty input, so
  # the fallback would never run.
  if (( ${#existing[@]} == 0 )); then
    printf '%s\n' "$empty_msg"
    return 0
  fi

  # stderr is silenced on purpose: a file may vanish between the existence
  # check and the listing, and this is a best-effort status display.
  ls -lhtr -- "${existing[@]}" 2>/dev/null | tail -n 5
}

#######################################
# Print the most recently modified regular file among the arguments.
# Arguments: $@ - candidate paths (non-files are skipped)
# Outputs:   the newest path on stdout; nothing if no argument is a file
# Returns:   0 if a file was found, 1 otherwise
#######################################
newest_file() {
  local newest="" candidate
  for candidate in "$@"; do
    [[ -f "$candidate" ]] || continue
    if [[ -z "$newest" || "$candidate" -nt "$newest" ]]; then
      newest=$candidate
    fi
  done
  [[ -n "$newest" ]] || return 1
  printf '%s\n' "$newest"
}

main() {
  local latest_log

  echo "================================================"
  echo "ChessHacks Training Monitor"
  echo "================================================"
  echo ""

  # Check for running training processes.
  # The [t] bracket expression stops grep from matching its own command
  # line, so no second `grep -v grep` stage is needed.
  echo "Active training processes:"
  ps aux | grep '[t]rain_overnight' || echo " (none)"
  echo ""

  echo "Latest log files:"
  list_recent " (no logs)" logs/training_*.log
  echo ""

  echo "Model checkpoints:"
  list_recent " (no checkpoints)" checkpoints/model_*.pth
  echo ""

  echo "Latest training log output (last 50 lines):"
  echo "================================================"
  # Resolve the newest log once so the file that is tested is the file
  # that is printed.
  latest_log=$(newest_file logs/training_*.log)
  if [[ -n "$latest_log" ]]; then
    tail -n 50 -- "$latest_log"
  else
    echo "(no logs found)"
  fi
}

main "$@"