TEST: use tensorboard for stuff
This commit is contained in:
parent
2d31162c58
commit
524ee03187
10 changed files with 212 additions and 12 deletions
36
_DDPShA-train.sh
Normal file
36
_DDPShA-train.sh
Normal file
|
|
@ -0,0 +1,36 @@
|
|||
#!/bin/bash
# Slurm batch job: launches train.py for the 'stn' model with DDP enabled
# across four GPUs (world size 4, devices 0-3).
#
# The interpreter is bash rather than sh because the script relies on
# `source`, which is not a POSIX sh builtin and fails where /bin/sh is dash.
#
# Resource request: 1 node, 1 task, 4 GPUs, --mem=24000, 3-day time limit.
#SBATCH -N 1
#SBATCH -n 1
#SBATCH --partition=Teach-Standard
#SBATCH --gres=gpu:4
#SBATCH --mem=24000
#SBATCH --time=3-00:00:00

# Abort on the first failing command so training never starts in a
# half-configured environment.
set -e

# CUDA / cuDNN install locations used to build the search paths below.
export CUDA_HOME=/opt/cuda-9.0.176.1/
export CUDNN_HOME=/opt/cuDNN-7.0/

# Assign first, export second: `export VAR=$(cmd)` reports export's own
# status and would hide a whoami failure from `set -e`.
STUDENT_ID=$(whoami)
export STUDENT_ID

export LD_LIBRARY_PATH="${CUDNN_HOME}/lib64:${CUDA_HOME}/lib64:${LD_LIBRARY_PATH}"
export LIBRARY_PATH="${CUDNN_HOME}/lib64:${LIBRARY_PATH}"
export CPATH="${CUDNN_HOME}/include:${CPATH}"
export PATH="${CUDA_HOME}/bin:${PATH}"
# NOTE(review): Python reads PYTHONPATH, not PYTHON_PATH; kept as in the
# original because the intent is unclear from this file - confirm.
export PYTHON_PATH="${PATH}"

# Point temporary files at the per-user scratch directory.
scratch_dir="/disk/scratch/${STUDENT_ID}"
mkdir -p -- "${scratch_dir}"
export TMPDIR="${scratch_dir}/"
export TMP="${scratch_dir}/"

# Activate the conda environment that provides the python used below.
source "/home/${STUDENT_ID}/miniconda3/bin/activate" mlp-cuda

# The save path is timestamped to the minute, so each submission gets its
# own output directory.
python train.py \
  --pth_tar './pretrained/deit_base_patch16_384-8de9b5d1.pth' \
  --model 'stn' \
  --save_path "./save/DDP-ShanghaiA-stn-$(date -Iminutes)" \
  --batch_size 4 \
  --use_ddp True \
  --ddp_world_size 4 \
  --gpus 0,1,2,3 \
  --print_freq 100
|
||||
|
||||
Loading…
Add table
Add a link
Reference in a new issue