-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathstart_tensorboard.sh
More file actions
executable file
·37 lines (31 loc) · 987 Bytes
/
start_tensorboard.sh
File metadata and controls
executable file
·37 lines (31 loc) · 987 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
#!/bin/bash
# Start TensorBoard for training monitoring.
#
# Usage:
#   start_tensorboard.sh [LOGDIR]
#
# Arguments:
#   LOGDIR  Directory passed to `tensorboard --logdir`. Takes precedence
#           over the LOGDIR environment variable when given.
#
# Environment:
#   ENV_NAME  Conda environment to activate (default: verl).
#   LOGDIR    Log directory used when no argument is passed
#             (default: <directory of this script>/verl/tensorboard_log).
#   PORT      Value passed to `tensorboard --port` (default: 6006).
#
# Exits non-zero (with a message on stderr) when the log directory does not
# exist, when conda is not available, or when tensorboard is not on PATH
# after the environment has been activated.

# NOTE: `set -u` is intentionally not enabled. The conda hook and activation
# code are evaluated in this shell and may reference unset variables.
set -e

# Print an error message to stderr and abort.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

REPO_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
ENV_NAME="${ENV_NAME:-verl}"
# Precedence: first positional argument, then $LOGDIR, then the repo default.
LOGDIR="${1:-${LOGDIR:-$REPO_DIR/verl/tensorboard_log}}"
PORT="${PORT:-6006}"

# Pre-flight checks run before the banner so a failure is not preceded by a
# misleading "Starting TensorBoard..." message.
if [[ ! -d "$LOGDIR" ]]; then
  echo "ERROR: Log directory not found at $LOGDIR" >&2
  echo "Pass a log directory as the first argument or set LOGDIR." >&2
  exit 1
fi

# Without this check a missing conda only surfaces as "command not found"
# from the activation step below.
command -v conda >/dev/null 2>&1 \
  || die "conda not found on PATH; cannot activate environment '$ENV_NAME'."

echo "Starting TensorBoard..."
echo "Log directory: $LOGDIR"
echo "Port: $PORT"
echo ""
echo "Access TensorBoard at:"
echo " Local: http://localhost:$PORT"
echo " Remote: Use SSH port forwarding if needed"
echo ""
echo "SSH port forwarding example:"
echo " ssh -L $PORT:localhost:$PORT <username>@<server-address>"
echo ""
echo "Press Ctrl+C to stop TensorBoard"
echo "=========================================="
echo ""

# Activate conda environment. The hook defines the `conda` shell function
# that `conda activate` needs in a non-interactive shell.
eval "$(conda shell.bash hook)"
conda activate "$ENV_NAME"

command -v tensorboard >/dev/null 2>&1 \
  || die "tensorboard not found in conda environment '$ENV_NAME'."

# Start TensorBoard. `exec` replaces this shell so Ctrl+C and the exit status
# go straight to/from tensorboard instead of through a wrapper process.
# NOTE(review): --bind_all listens on every network interface, not just
# localhost; kept for backward compatibility — confirm this exposure is wanted.
exec tensorboard --logdir="$LOGDIR" --port="$PORT" --bind_all