- Since CUDA 9.1 doesn't support LLVM 9.0.0, you need to install Xcode 8.3.2 with LLVM 8.1.0 for compiling CUDA programs.
- Select
Xcode 8.3.2
for Command Line Tools in Xcode. (Or use xcode-select
)
- Clone MXNet
$ https://github.com/apache/incubator-mxnet.git --recursive
$ cd incubator-mxnet
- Configure:
- use default config for macOS:
$ cp make/osx.mk config.mk
- Give only one
KNOWN_CUDA_ARCHS
to spped up compiling:
diff --git a/Makefile b/Makefile
index 8584ab65..0b6e4792 100644
--- a/Makefile
+++ b/Makefile
@@ -254,7 +254,8 @@ endif
# be JIT-compiled by the updated driver from the included PTX.
ifeq ($(USE_CUDA), 1)
ifeq ($(CUDA_ARCH),)
- KNOWN_CUDA_ARCHS := 30 35 50 52 60 61 70
+ # KNOWN_CUDA_ARCHS := 30 35 50 52 60 61 70
+ KNOWN_CUDA_ARCHS := 61
# Run nvcc on a zero-length file to check architecture-level support.
# Create args to include SASS in the fat binary for supported levels.
CUDA_ARCH := $(foreach arch,$(KNOWN_CUDA_ARCHS), \
- Compile
$ make -j4 USE_OPENCV=1 USE_CUDA=1 USE_CUDA_PATH=/usr/local/cuda USE_CUDNN=1
- Install
$ cd python
$ pip3 install --upgrade pip
$ pip3 install -e .
- Validate
>>> import mxnet as mx
>>> a = mx.nd.ones((2, 3), mx.gpu())
>>> b = a * 2 + 1
>>> b.asnumpy()
array([[ 3., 3., 3.],
[ 3., 3., 3.]], dtype=float32)