# Basic configuration | |
export CUDA_VISIBLE_DEVICES="0,1" | |
export PYTHONWARNINGS="ignore" | |
export PYTHONPATH="${PYTHONPATH}:${PWD}" # Add current directory to Python path | |
# Create directories | |
mkdir -p logs weights cache | |
# Get timestamp for error log only | |
TIMESTAMP=$(date +%Y%m%d_%H%M%S) | |
ERROR_LOG="logs/error_${TIMESTAMP}.log" | |
# Print configuration | |
echo "Starting training with configuration:" | |
echo "======================================" | |
echo "Error log: $ERROR_LOG" | |
echo "PYTHONPATH: $PYTHONPATH" | |
echo "======================================" | |
# Start training with nohup, only redirecting stderr | |
echo "Starting training in background..." | |
nohup python model/train.py 2> "$ERROR_LOG" & | |
# Save process ID | |
pid=$! | |
echo $pid > "logs/train_${TIMESTAMP}.pid" | |
echo "Training process started with PID: $pid" | |
echo | |
echo "Monitor commands:" | |
echo "1. View error log: tail -f $ERROR_LOG" | |
echo "2. Check process status: ps -p $pid" | |
echo "3. Stop training: kill $pid" |