在CentOS下管理PyTorch项目可按以下步骤进行:
sudo yum update -y
sudo yum install python3 python3-pip -y
sudo yum groupinstall -y "Development Tools"
venv:python3 -m venv pytorch_env
source pytorch_env/bin/activate
conda(需先安装Miniconda/Anaconda):conda create -n pytorch_env python=3.8
conda activate pytorch_env
pip install torch torchvision torchaudio
nvidia-smi
pip install torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cu117
conda安装:conda install pytorch torchvision torchaudio cudatoolkit=11.7 -c pytorch
如果项目提供了requirements.txt,执行:pip install -r requirements.txt
pip freeze > requirements.txt
python your_script.py
pdb:在代码中插入import pdb; pdb.set_trace()
from torch.cuda.amp import autocast
with autocast():
    # 训练代码
使用DistributedDataParallel实现多GPU训练
torch.onnx.export(model, input, "model.onnx")
pip list --outdated --format=freeze | cut -d = -f 1 | xargs -n1 pip install -U
参考来源: