Deepin 23.1 上的 docker 使用 GPU

24 阅读1分钟
# Confirm that the system can see the graphics card.
lspci | grep --ignore-case nvidia

# Confirm that the driver is working.
nvidia-smi

# If the driver is missing, install the 570 series.
# All three packages are pinned to the same version (570.124.04-1).
# Package installation needs root, so run it through sudo like the other
# privileged commands in this guide.
sudo apt-get install -y \
  nvidia-driver=570.124.04-1 \
  nvidia-vdpau-driver=570.124.04-1 \
  nvidia-kernel-dkms=570.124.04-1

# Install the NVIDIA Container Toolkit.
# The distribution is hard-coded to "debian10" rather than detected from the
# running system.
# NOTE(review): presumably because NVIDIA's repository has no Deepin-specific
# entry -- confirm.
distribution="debian10"
# -f makes curl exit non-zero on an HTTP error instead of piping the server's
# error page into apt-key or into the APT sources file; -S still prints the
# error even though -s silences the progress meter.
# NOTE(review): apt-key is deprecated in current apt releases; consider
# switching to a signed-by keyring as described in NVIDIA's install guide.
curl -fsSL https://nvidia.github.io/nvidia-docker/gpgkey | sudo apt-key add -
curl -fsSL "https://nvidia.github.io/nvidia-docker/${distribution}/nvidia-docker.list" \
  | sudo tee /etc/apt/sources.list.d/nvidia-docker.list
sudo apt-get update
sudo apt-get install -y nvidia-container-toolkit
# Restart the Docker daemon after installing the toolkit.
sudo systemctl restart docker

# Check whether the package is installed.
dpkg --list | grep nvidia-container-toolkit

#正常输出:
ii  nvidia-container-toolkit                          1.13.5-1                                 amd64        NVIDIA Container toolkit
ii  nvidia-container-toolkit-base                     1.13.5-1                                 amd64        NVIDIA Container Toolkit Base

#在 /etc/docker/daemon.json 的顶层 JSON 对象（最外层的 { } 内）中添加以下内容，文件不存在时需先创建:
"runtimes": { "nvidia": { "path": "nvidia-container-runtime", "runtimeArgs": [] } }

# Restart the Docker service.
sudo systemctl restart docker

# Verify that the change took effect.
docker info | grep --ignore-case runtime

#正常输出:
Runtimes: io.containerd.runc.v2 nvidia runc
Default Runtime: runc

#在 compose 文件中需要使用 GPU 的服务（services 下的对应服务）里加入以下配置:
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]

# Run this inside the container to verify that the configuration took effect.
nvidia-smi