#!/usr/bin/env bash
#
# Start this node's worker processes for a multi-node train_mono3d.py run,
# using the torch.distributed.run launcher.
#
# Usage (per the NODE_RANK hint below, run with a NODE_RANK set for the node):
#   NODE_RANK=0 bash <this-script>
#
# Environment variables:
#   NODE_RANK       (required) forwarded as --node_rank
#   NNODES          forwarded as --nnodes          (default: 4)
#   MASTER_ADDR     forwarded as --master_addr     (default: 10.232.82.69)
#   MASTER_PORT     forwarded as --master_port     (default: 29500)
#   NPROC_PER_NODE  forwarded as --nproc_per_node  (default: 8)
#   PYTHON_BIN      interpreter that runs the launcher
#                   (default: /home/fcheng/miniconda/bin/python)
#
# train_mono3d.py and the ./runs/... paths are relative, so they are resolved
# against the directory the script is invoked from.

# Strict mode must live on its own line: anything that shares the shebang line
# is never executed as a shell command.
set -euo pipefail

# Launcher settings; each one can be overridden from the environment.
NNODES=${NNODES:-4}
MASTER_ADDR=${MASTER_ADDR:-10.232.82.69}
MASTER_PORT=${MASTER_PORT:-29500}
NPROC_PER_NODE=${NPROC_PER_NODE:-8}
PYTHON_BIN=${PYTHON_BIN:-/home/fcheng/miniconda/bin/python}

# NODE_RANK has no default: abort with a usage hint when it is unset or empty.
# NOTE(review): the hint names train_mono3d_roi1.sh while this configuration
# uses roi0 -- confirm the script name is the intended one.
NODE_RANK=${NODE_RANK:?Please set NODE_RANK, for example: NODE_RANK=0 bash train_mono3d_roi1.sh}

# Arguments are kept in arrays so that no fragile backslash line continuations
# are needed and each element reaches the child process as exactly one word.
launcher=(
  "${PYTHON_BIN}" -m torch.distributed.run
  --nnodes="${NNODES}"
  --node_rank="${NODE_RANK}"
  --master_addr "${MASTER_ADDR}"
  --master_port "${MASTER_PORT}"
  --nproc_per_node "${NPROC_PER_NODE}"
)

# Options handed to train_mono3d.py unchanged; their meaning is defined by that
# script, not here.
train_args=(
  --model yolo26s
  --epochs 50
  --lr0 0.0003
  --lrf 0.33
  --e2e_o2m_start 0.3
  --e2e_o2m_final 0.1
  --batch 512
  --imgsz 768,352
  --pretrained ./runs/detect/train_mono3d_roi0_20260406/weights/last.pt
  --roi_metrics_only
  --warmup_epochs 1
  --loss_3d_warmup_epochs 0
  --loss_3d_ramp_epochs 3
  --loss_3d_weight_max 0.05
  --roi roi0
  --exp_dir=./runs/detect/train_mono3d_roi0_20260413
)

"${launcher[@]}" train_mono3d.py "${train_args[@]}"