Files
yolov26_3d/train_mono3d_roi1_node_finetuning.sh

34 lines
901 B
Bash
Raw Normal View History

2026-06-24 09:35:46 +08:00
#!/usr/bin/env bash
#
# Start this node's share of a multi-node train_mono3d.py run (roi1
# fine-tuning) through the torch.distributed.run launcher.
#
# Run the script once on every participating node, each with its own
# NODE_RANK. train_mono3d.py and the ./runs/... paths below are relative, so
# they are resolved against the directory the script is invoked from.
#
#   NODE_RANK=0 bash train_mono3d_roi1_node_finetuning.sh
#
# Environment:
#   NODE_RANK       required; forwarded as --node_rank
#   NNODES          forwarded as --nnodes          (default: 4)
#   MASTER_ADDR     forwarded as --master_addr     (default: 10.232.118.76)
#   MASTER_PORT     forwarded as --master_port     (default: 29500)
#   NPROC_PER_NODE  forwarded as --nproc_per_node  (default: 8)
#   PYTHON          interpreter that runs the launcher
#                   (default: /home/fcheng/miniconda/bin/python)
set -euo pipefail

# Fail fast, before anything else is evaluated, when the per-node rank is
# missing. The hint prints $0 so that it always names the script that was
# actually invoked.
NODE_RANK=${NODE_RANK:?Please set NODE_RANK, for example: NODE_RANK=0 bash $0}

NNODES=${NNODES:-4}
MASTER_ADDR=${MASTER_ADDR:-10.232.118.76}
MASTER_PORT=${MASTER_PORT:-29500}
NPROC_PER_NODE=${NPROC_PER_NODE:-8}
# Overridable so the script also works on hosts where the interpreter lives
# somewhere else; the default keeps the previous behaviour.
PYTHON=${PYTHON:-/home/fcheng/miniconda/bin/python}

# Options consumed by torch.distributed.run itself.
launcher_args=(
  --nnodes="${NNODES}"
  --node_rank="${NODE_RANK}"
  --master_addr "${MASTER_ADDR}"
  --master_port "${MASTER_PORT}"
  --nproc_per_node "${NPROC_PER_NODE}"
)

# Options passed through to train_mono3d.py. Their exact semantics are
# defined by that script, which is not part of this file.
train_args=(
  --model yolo26s
  --epochs 50
  --lr0 0.0003
  --lrf 0.33
  --e2e_o2m_start 0.3
  --e2e_o2m_final 0.1
  --batch 512
  --imgsz 768,352
  # Starting weights: last checkpoint of the 20260406 roi1 run.
  --pretrained ./runs/detect/train_mono3d_roi1_20260406/weights/last.pt
  --roi_metrics_only
  --warmup_epochs 1
  --loss_3d_warmup_epochs 0
  --loss_3d_ramp_epochs 3
  --loss_3d_weight_max 0.05
  --roi roi1
  --exp_dir=./runs/detect/train_mono3d_roi1_20260413
)

# exec replaces this shell with the launcher, so signals sent to the
# script's PID (Ctrl-C, a scheduler's SIGTERM) reach the launcher directly
# and its exit status becomes the script's exit status.
exec "${PYTHON}" -m torch.distributed.run \
  "${launcher_args[@]}" \
  train_mono3d.py \
  "${train_args[@]}"