# Print the version string exposed by the loaded amdgpu kernel module.
# Reading the sysfs file directly avoids the word-splitting of an unquoted
# $(...) and lets a missing file surface as a cat error and non-zero status.
cat /sys/module/amdgpu/version
# Install the rocm-dev package with apt (no -y, so apt-get asks for
# confirmation before installing).
sudo apt-get install rocm-dev
or
# Refresh the apt package index first so that the upgrade below sees the
# latest available versions.
sudo apt-get update
# Upgrade all installed packages that have newer versions available.
sudo apt-get upgrade
# Start the Docker socket unit via systemd.
sudo systemctl start docker.socket

# Fetch the rocm/pytorch image (default tag).
docker pull rocm/pytorch

# Open an interactive shell in a throw-away (--rm) container named
# rocm-pytorch. The host device nodes /dev/kfd and /dev/dri are passed
# through, the container user is added to the "video" group, and the host
# directory /mnt/Data/GPU-ROCm/AI/Data is mounted at /data.
sudo docker run \
  --interactive --tty \
  --rm \
  --name=rocm-pytorch \
  --privileged \
  --device=/dev/kfd \
  --device=/dev/dri \
  --group-add video \
  --volume /mnt/Data/GPU-ROCm/AI/Data:/data \
  rocm/pytorch
# NOTE(review): no sudo here, so these are presumably typed inside the
# container shell started by the preceding docker run -- confirm.

# Install kmod non-interactively (--yes answers the confirmation prompt).
apt-get install --yes kmod

# Run the ROCm and OpenCL info tools.
rocminfo
clinfo
# Run the PyTorch test driver with PYTORCH_TEST_WITH_ROCM=1 set in its
# environment. The script path is relative, so run this from the directory
# that contains test/.
# NOTE: --verbose must be typed with two ASCII hyphens; a copy-pasted en dash
# (U+2013) would be passed to the script as an unrecognized argument.
PYTORCH_TEST_WITH_ROCM=1 python3.6 test/run_test.py --verbose
>/src/external/hip-on-vdi/rocclr/hip_code_object.cpp:92: guarantee(false && "hipErrorNoBinaryForGpu: Coudn't find binary for current devices!")
Aborted (core dumped)
No tests will fail if the compilation and installation are correct.
# Install torchvision with pip.
pip install torchvision

# Remove unused Docker data; --force skips the confirmation prompt.
docker system prune --force

# Build the image from the Ubuntu 18.04 Dockerfile using the current
# directory as build context, removing intermediate containers (--rm),
# and tag the result qpanprojects/rocm:latest.
docker build \
  --rm \
  --file ./ci/docker/ubuntu18.04.Dockerfile \
  --tag qpanprojects/rocm:latest \
  .

# Publish the tagged image to its registry.
docker push qpanprojects/rocm:latest