https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html
docker build -t cs269_full -f full.dockerfile .
docker run -ti --gpus all --shm-size=1g --ulimit memlock=-1 -e "TERM=xterm-256color" -v "$(pwd):/workspace" -v /etc/localtime:/etc/localtime:ro -v "$HOME"/.zsh_history_docker:/root/.zsh_history:z -e HIST_FILE="/root/.zsh_history" --network host cs269_full
Note that docker run automatically starts Jupyter and TensorBoard.
ssh -o "UserKnownHostsFile=/dev/null" -o "StrictHostKeyChecking=no" root@localhost -p 7722
localhost:8888
localhost:6006
docker build -t cs269_slim -f slim.dockerfile .
docker run -ti --shm-size=1g -e "TERM=xterm-256color" -v "$(pwd):/workspace" -p 7722:7722 -v /etc/localtime:/etc/localtime:ro cs269_slim
ssh -o "UserKnownHostsFile=/dev/null" -o "StrictHostKeyChecking=no" root@localhost -p 7722
Hoffman2 does not support Docker, so you will need to set up the conda environment manually.
qrsh -l h_rt=1:00:00,h_data=4G,gpu,RTX2080Ti
module load python/anaconda3
module load cuda/10.2
module load glibc/2.14
conda create --name EML
conda activate EML
conda install pytorch torchvision -c pytorch -y
conda config --append channels conda-forge
conda install expect gdown snakeviz -y
pip install rigl_torch
Download login script
wget https://gitlab.idre.ucla.edu/dauria/jupyter-notebook/raw/master/h2jupynb
python h2jupynb -u username -v anaconda3 -d Edge_Meta_Learning -t session_length_in_hours -m session_memory_in_GB -g yes -c V100
docker run ...
python3 -m cProfile -o results.prof main.py
snakeviz results.prof -p 4433 -s -H 0.0.0.0
Go to localhost:4433/snakeviz/%2Fworkspace%2Fresults.prof in a browser.