Closed SumNeuron closed 6 years ago
The gist of the error is:
nvcc fatal : The version ('80100') of the host compiler ('Apple clang') is not supported
The problem is that nvcc doesn't support the new clang compiler that comes with the newer Xcode versions. You will need to revert your command line tools to 7.3.3 or 8.0. You may refer to my Stack Overflow answer on how to revert the command line tools (note that the answer reverts to 7.2, but you can pick the appropriate version when downloading).
ok, I will do that... and new errors:
make
cd /Users/sumner/Downloads/mxnet/dmlc-core; /Library/Developer/CommandLineTools/usr/bin/make libdmlc.a USE_SSE=1 config=/Users/sumner/Downloads/mxnet/config.mk; cd /Users/sumner/Downloads/mxnet
make[1]: `libdmlc.a' is up to date.
/usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=[sm_61,compute_61] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/Users/sumner/Downloads/mxnet/mshadow/ -I/Users/sumner/Downloads/mxnet/dmlc-core/include -fPIC -I/Users/sumner/Downloads/mxnet/nnvm/include -I/Users/sumner/Downloads/mxnet/dlpack/include -Iinclude -funroll-loops -Wno-unused-variable -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_OPENCV=1 -I/usr/local/Cellar/opencv/3.3.0_3/include/opencv -I/usr/local/Cellar/opencv/3.3.0_3/include -DMSHADOW_USE_CUDNN=1 -I/usr/local/opt/openblas/include -I/Users/sumner/Downloads/mxnet/cub -DMXNET_USE_NVRTC=0" -M -MT build/src/operator/contrib/count_sketch_gpu.o src/operator/contrib/count_sketch.cu >build/src/operator/contrib/count_sketch_gpu.d
/usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/count_sketch_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=[sm_61,compute_61] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/Users/sumner/Downloads/mxnet/mshadow/ -I/Users/sumner/Downloads/mxnet/dmlc-core/include -fPIC -I/Users/sumner/Downloads/mxnet/nnvm/include -I/Users/sumner/Downloads/mxnet/dlpack/include -Iinclude -funroll-loops -Wno-unused-variable -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_OPENCV=1 -I/usr/local/Cellar/opencv/3.3.0_3/include/opencv -I/usr/local/Cellar/opencv/3.3.0_3/include -DMSHADOW_USE_CUDNN=1 -I/usr/local/opt/openblas/include -I/Users/sumner/Downloads/mxnet/cub -DMXNET_USE_NVRTC=0" src/operator/contrib/count_sketch.cu
/Users/sumner/Downloads/mxnet/dmlc-core/include/dmlc/./thread_local.h:40:8: error: thread-local storage is not supported for the
current target
static thread_local T inst;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:110:7: warning: private field 'm_program_break' is not used
[-Wunused-private-field]
void *m_program_break;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:113:8: warning: private field 'm_max_data_segment_size' is not used
[-Wunused-private-field]
size_t m_max_data_segment_size;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:242:15: warning: private field 'm_is_free' is not used
[-Wunused-private-field]
private: bool m_is_free:1;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:243:8: warning: private field 'm_size' is not used
[-Wunused-private-field]
size_t m_size:((8) * sizeof(size_t)) - (1);
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:244:8: warning: private field 'm_prev' is not used
[-Wunused-private-field]
block *m_prev;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:445:19: warning: private field 'm_in_use' is not used
[-Wunused-private-field]
private: unsigned m_in_use;
^
6 warnings and 1 error generated.
make: *** [build/src/operator/contrib/count_sketch_gpu.o] Error 1
myhost:mxnet sumner$ pwd
/Users/sumner/Downloads/mxnet
Could you do a make clean, pull the latest master, and try again?
Ran make clean, then ran git clone --recursive https://github.com/apache/incubator-mxnet.git mxnet --branch 0.11.0, and tried:
make
g++ -std=c++11 -c -DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/Users/sumner/Downloads/mxnet/mshadow/ -I/Users/sumner/Downloads/mxnet/dmlc-core/include -fPIC -I/Users/sumner/Downloads/mxnet/nnvm/include -I/Users/sumner/Downloads/mxnet/dlpack/include -Iinclude -funroll-loops -Wno-unused-variable -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_OPENCV=1 -I/usr/local/Cellar/opencv/3.3.0_3/include/opencv -I/usr/local/Cellar/opencv/3.3.0_3/include -DMSHADOW_USE_CUDNN=1 -I/usr/local/opt/openblas/include -I/Users/sumner/Downloads/mxnet/cub -DMXNET_USE_NVRTC=0 -MMD -c src/operator/contrib/count_sketch.cc -o build/src/operator/contrib/count_sketch.o
In file included from src/operator/contrib/count_sketch.cc:25:
In file included from src/operator/contrib/./count_sketch-inl.h:29:
In file included from include/mxnet/operator.h:32:
In file included from /Users/sumner/Downloads/mxnet/nnvm/include/nnvm/node.h:13:
In file included from /Users/sumner/Downloads/mxnet/nnvm/include/nnvm/./base.h:11:
In file included from /Users/sumner/Downloads/mxnet/dmlc-core/include/dmlc/memory.h:12:
/Users/sumner/Downloads/mxnet/dmlc-core/include/dmlc/./thread_local.h:40:12: error: thread-local storage is not supported for the
current target
static thread_local T inst;
^
1 error generated.
make: *** [build/src/operator/contrib/count_sketch.o] Error 1
The branch 0.11.0 doesn't have the fix. Please use the master head instead.
I also tried with --branch master. There are still a bunch of OpenMP / CXX11 thread_local warnings, as it is not installed (this should be added to the install instructions). It has been running for a while....
Finished installing. No errors during the install.
a = mx.nd.ones((100, 100), mx.gpu())
[22:59:37] src/c_api/c_api_ndarray.cc:147: GPU support is disabled. Compile MXNet with USE_CUDA=1 to enable GPU support.
[22:59:37] /Users/travis/build/dmlc/mxnet-distro/mxnet-build/dmlc-core/include/dmlc/logging.h:308: [22:59:37] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries:
[bt] (0) 0 libmxnet.so 0x000000010f4dbad8 _ZN4dmlc15LogMessageFatalD2Ev + 40
[bt] (1) 1 libmxnet.so 0x000000010fbdabbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9_EEEESD_ + 2079
[bt] (2) 2 libmxnet.so 0x000000010fbdb7f1 MXImperativeInvoke + 433
[bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x000000010e63142f ffi_call_unix64 + 79
[bt] (4) 4 ??? 0x00007fff51bc0920 0x0 + 140734564665632
Traceback (most recent call last):
File "<stdin>", line 1, in <module>
File "/usr/local/lib/python3.6/site-packages/mxnet/ndarray.py", line 1216, in ones
return _internal._ones(shape=shape, ctx=ctx, dtype=dtype, **kwargs)
File "<string>", line 15, in _ones
File "/usr/local/lib/python3.6/site-packages/mxnet/_ctypes/ndarray.py", line 89, in _imperative_invoke
c_array(ctypes.c_char_p, [c_str(str(val)) for val in vals])))
File "/usr/local/lib/python3.6/site-packages/mxnet/base.py", line 129, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [22:59:37] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries:
[bt] (0) 0 libmxnet.so 0x000000010f4dbad8 _ZN4dmlc15LogMessageFatalD2Ev + 40
[bt] (1) 1 libmxnet.so 0x000000010fbdabbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9_EEEESD_ + 2079
[bt] (2) 2 libmxnet.so 0x000000010fbdb7f1 MXImperativeInvoke + 433
[bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x000000010e63142f ffi_call_unix64 + 79
[bt] (4) 4 ??? 0x00007fff51bc0920 0x0 + 140734564665632
Did you turn on the GPU support when checking out?
I was able to do this successfully on my mac. Let me quickly update the guide.
Prepared environment:
export CUDA_HOME=/usr/local/cuda
export DYLD_LIBRARY_PATH="$CUDA_HOME/lib:$DYLD_LIBRARY_PATH"
export PATH="$CUDA_HOME/bin:$PATH"
installed all dependencies from the link in the original post.
then did this:
git clone --recursive https://github.com/apache/incubator-mxnet.git mxnet --branch master
cd ~/mxnet
cp make/osx.mk ./config.mk
echo "USE_BLAS = openblas" >> ./config.mk
echo "ADD_CFLAGS += -I/usr/local/opt/openblas/include" >> ./config.mk
echo "ADD_LDFLAGS += -L/usr/local/opt/openblas/lib" >> ./config.mk
echo "ADD_LDFLAGS += -L/usr/local/lib/graphviz/" >> ./config.mk
echo "USE_CUDA = 1" >> ./config.mk
echo "USE_CUDA_PATH = /usr/local/cuda" >> ./config.mk
echo "USE_CUDNN = 1" >> ./config.mk
make
Here is a small chunk of the error message. The full message is so long that 1/4 of it goes over the character limit :)
`
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:242:15: warning: private field 'm_is_free' is not used
[-Wunused-private-field]
private: bool m_is_free:1;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:243:8: warning: private field 'm_size' is not used
[-Wunused-private-field]
size_t m_size:((8) * sizeof(size_t)) - (1);
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:244:8: warning: private field 'm_prev' is not used
[-Wunused-private-field]
block *m_prev;
^
/usr/local/cuda/include/thrust/system/cuda/detail/bulk/malloc.hpp:445:19: warning: private field 'm_in_use' is not used
[-Wunused-private-field]
private: unsigned m_in_use;
^
230 warnings generated.
ar crv lib/libmxnet.a build/src/operator/contrib/count_sketch.o build/src/operator/contrib/ctc_loss.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dequantize.o build/src/operator/contrib/fft.o build/src/operator/contrib/ifft.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/multibox_prior.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/proposal.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quantize.o build/src/operator/custom/custom.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/mkl/mkl_cppwrapper.o build/src/operator/mkl/mkl_memory.o build/src/operator/nn/softmax.o build/src/operator/nnpack/nnpack_util.o build/src/operator/random/multisample_op.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/sample_op.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/dot.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/elemwise_unary_op.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/la_op.o 
build/src/operator/tensor/matrix_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/square_sum.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_function.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_predict_api.o build/src/common/mxrtc.o build/src/common/utils.o build/src/engine/engine.o build/src/engine/naive_engine.o build/src/engine/profiler.o build/src/engine/threaded_engine.o build/src/engine/threaded_engine_perdevice.o build/src/engine/threaded_engine_pooled.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/executor/graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/inplace_addto_detect_pass.o build/src/io/image_aug_default.o build/src/io/image_det_aug_default.o build/src/io/image_io.o build/src/io/io.o build/src/io/iter_csv.o build/src/io/iter_image_det_recordio.o build/src/io/iter_image_recordio.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/io/iter_mnist.o build/src/kvstore/kvstore.o build/src/ndarray/autograd.o build/src/ndarray/ndarray.o build/src/ndarray/ndarray_function.o build/src/nnvm/legacy_json_util.o build/src/nnvm/legacy_op_util.o build/src/operator/activation.o build/src/operator/batch_norm.o build/src/operator/batch_norm_v1.o build/src/operator/bilinear_sampler.o build/src/operator/concat.o build/src/operator/convolution.o build/src/operator/convolution_v1.o build/src/operator/correlation.o build/src/operator/crop.o build/src/operator/cross_device_copy.o build/src/operator/cudnn_algoreg.o build/src/operator/cudnn_batch_norm.o build/src/operator/deconvolution.o build/src/operator/dropout.o build/src/operator/fully_connected.o build/src/operator/grid_generator.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/instance_norm.o 
build/src/operator/l2_normalization.o build/src/operator/leaky_relu.o build/src/operator/loss_binary_op.o build/src/operator/lrn.o build/src/operator/make_loss.o build/src/operator/operator.o build/src/operator/operator_util.o build/src/operator/optimizer_op.o build/src/operator/pad.o build/src/operator/pooling.o build/src/operator/pooling_v1.o build/src/operator/regression_output.o build/src/operator/rnn.o build/src/operator/roi_pooling.o build/src/operator/sequence_last.o build/src/operator/sequence_mask.o build/src/operator/sequence_reverse.o build/src/operator/slice_channel.o build/src/operator/softmax_activation.o build/src/operator/softmax_output.o build/src/operator/spatial_transformer.o build/src/operator/svm_output.o build/src/operator/swapaxis.o build/src/operator/upsampling.o build/src/storage/storage.o build/src/initialize.o build/src/resource.o build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/ctc_loss_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/dequantize_gpu.o build/src/operator/contrib/fft_gpu.o build/src/operator/contrib/ifft_gpu.o build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/quantize_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o build/src/operator/random/sample_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/dot_gpu.o 
build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/elemwise_unary_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/common/utils_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/activation_gpu.o build/src/operator/batch_norm_gpu.o build/src/operator/batch_norm_v1_gpu.o build/src/operator/bilinear_sampler_gpu.o build/src/operator/concat_gpu.o build/src/operator/convolution_gpu.o build/src/operator/convolution_v1_gpu.o build/src/operator/correlation_gpu.o build/src/operator/crop_gpu.o build/src/operator/cudnn_batch_norm_gpu.o build/src/operator/deconvolution_gpu.o build/src/operator/dropout_gpu.o build/src/operator/fully_connected_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/loss_binary_op_gpu.o build/src/operator/lrn_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/pad_gpu.o build/src/operator/pooling_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/rnn_gpu.o 
build/src/operator/roi_pooling_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/softmax_activation_gpu.o build/src/operator/softmax_output_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/upsampling_gpu.o
a - build/src/operator/contrib/count_sketch.o
a - build/src/operator/contrib/ctc_loss.o
a - build/src/operator/contrib/deformable_convolution.o
a - build/src/operator/contrib/deformable_psroi_pooling.o
a - build/src/operator/contrib/dequantize.o
a - build/src/operator/contrib/fft.o
a - build/src/operator/contrib/ifft.o
a - build/src/operator/contrib/multi_proposal.o
a - build/src/operator/contrib/multibox_detection.o
a - build/src/operator/contrib/multibox_prior.o
a - build/src/operator/contrib/multibox_target.o
a - build/src/operator/contrib/proposal.o
a - build/src/operator/contrib/psroi_pooling.o
a - build/src/operator/contrib/quantize.o
a - build/src/operator/custom/custom.o
a - build/src/operator/custom/native_op.o
a - build/src/operator/custom/ndarray_op.o
a - build/src/operator/mkl/mkl_cppwrapper.o
a - build/src/operator/mkl/mkl_memory.o
a - build/src/operator/nn/softmax.o
a - build/src/operator/nnpack/nnpack_util.o
a - build/src/operator/random/multisample_op.o
a - build/src/operator/random/sample_multinomial_op.o
a - build/src/operator/random/sample_op.o
a - build/src/operator/tensor/broadcast_reduce_op_index.o
a - build/src/operator/tensor/broadcast_reduce_op_value.o
a - build/src/operator/tensor/cast_storage.o
a - build/src/operator/tensor/control_flow_op.o
a - build/src/operator/tensor/dot.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o
a - build/src/operator/tensor/elemwise_binary_op_basic.o
a - build/src/operator/tensor/elemwise_binary_op_extended.o
a - build/src/operator/tensor/elemwise_binary_op_logic.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_basic.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_extended.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_logic.o
a - build/src/operator/tensor/elemwise_sum.o
a - build/src/operator/tensor/elemwise_unary_op.o
a - build/src/operator/tensor/indexing_op.o
a - build/src/operator/tensor/init_op.o
a - build/src/operator/tensor/la_op.o
a - build/src/operator/tensor/matrix_op.o
a - build/src/operator/tensor/ordering_op.o
a - build/src/operator/tensor/sparse_retain.o
a - build/src/operator/tensor/square_sum.o
a - build/src/c_api/c_api.o
a - build/src/c_api/c_api_error.o
a - build/src/c_api/c_api_executor.o
a - build/src/c_api/c_api_function.o
a - build/src/c_api/c_api_ndarray.o
a - build/src/c_api/c_api_symbolic.o
a - build/src/c_api/c_predict_api.o
a - build/src/common/mxrtc.o
a - build/src/common/utils.o
a - build/src/engine/engine.o
a - build/src/engine/naive_engine.o
a - build/src/engine/profiler.o
a - build/src/engine/threaded_engine.o
a - build/src/engine/threaded_engine_perdevice.o
a - build/src/engine/threaded_engine_pooled.o
a - build/src/executor/attach_op_execs_pass.o
a - build/src/executor/attach_op_resource_pass.o
a - build/src/executor/graph_executor.o
a - build/src/executor/infer_graph_attr_pass.o
a - build/src/executor/inplace_addto_detect_pass.o
a - build/src/io/image_aug_default.o
a - build/src/io/image_det_aug_default.o
a - build/src/io/image_io.o
a - build/src/io/io.o
a - build/src/io/iter_csv.o
a - build/src/io/iter_image_det_recordio.o
a - build/src/io/iter_image_recordio.o
a - build/src/io/iter_image_recordio_2.o
a - build/src/io/iter_libsvm.o
a - build/src/io/iter_mnist.o
a - build/src/kvstore/kvstore.o
a - build/src/ndarray/autograd.o
a - build/src/ndarray/ndarray.o
a - build/src/ndarray/ndarray_function.o
a - build/src/nnvm/legacy_json_util.o
a - build/src/nnvm/legacy_op_util.o
a - build/src/operator/activation.o
a - build/src/operator/batch_norm.o
a - build/src/operator/batch_norm_v1.o
a - build/src/operator/bilinear_sampler.o
a - build/src/operator/concat.o
a - build/src/operator/convolution.o
a - build/src/operator/convolution_v1.o
a - build/src/operator/correlation.o
a - build/src/operator/crop.o
a - build/src/operator/cross_device_copy.o
a - build/src/operator/cudnn_algoreg.o
a - build/src/operator/cudnn_batch_norm.o
a - build/src/operator/deconvolution.o
a - build/src/operator/dropout.o
a - build/src/operator/fully_connected.o
a - build/src/operator/grid_generator.o
a - build/src/operator/identity_attach_KL_sparse_reg.o
a - build/src/operator/instance_norm.o
a - build/src/operator/l2_normalization.o
a - build/src/operator/leaky_relu.o
a - build/src/operator/loss_binary_op.o
a - build/src/operator/lrn.o
a - build/src/operator/make_loss.o
a - build/src/operator/operator.o
a - build/src/operator/operator_util.o
a - build/src/operator/optimizer_op.o
a - build/src/operator/pad.o
a - build/src/operator/pooling.o
a - build/src/operator/pooling_v1.o
a - build/src/operator/regression_output.o
a - build/src/operator/rnn.o
a - build/src/operator/roi_pooling.o
a - build/src/operator/sequence_last.o
a - build/src/operator/sequence_mask.o
a - build/src/operator/sequence_reverse.o
a - build/src/operator/slice_channel.o
a - build/src/operator/softmax_activation.o
a - build/src/operator/softmax_output.o
a - build/src/operator/spatial_transformer.o
a - build/src/operator/svm_output.o
a - build/src/operator/swapaxis.o
a - build/src/operator/upsampling.o
a - build/src/storage/storage.o
a - build/src/initialize.o
a - build/src/resource.o
a - build/src/operator/contrib/count_sketch_gpu.o
a - build/src/operator/contrib/ctc_loss_gpu.o
a - build/src/operator/contrib/deformable_convolution_gpu.o
a - build/src/operator/contrib/deformable_psroi_pooling_gpu.o
a - build/src/operator/contrib/dequantize_gpu.o
a - build/src/operator/contrib/fft_gpu.o
a - build/src/operator/contrib/ifft_gpu.o
a - build/src/operator/contrib/multi_proposal_gpu.o
a - build/src/operator/contrib/multibox_detection_gpu.o
a - build/src/operator/contrib/multibox_prior_gpu.o
a - build/src/operator/contrib/multibox_target_gpu.o
a - build/src/operator/contrib/proposal_gpu.o
a - build/src/operator/contrib/psroi_pooling_gpu.o
a - build/src/operator/contrib/quantize_gpu.o
a - build/src/operator/custom/native_op_gpu.o
a - build/src/operator/nn/softmax_gpu.o
a - build/src/operator/random/sample_multinomial_op_gpu.o
a - build/src/operator/random/sample_op_gpu.o
a - build/src/operator/tensor/broadcast_reduce_op_index_gpu.o
a - build/src/operator/tensor/broadcast_reduce_op_value_gpu.o
a - build/src/operator/tensor/cast_storage_gpu.o
a - build/src/operator/tensor/control_flow_op_gpu.o
a - build/src/operator/tensor/dot_gpu.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o
a - build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o
a - build/src/operator/tensor/elemwise_binary_op_basic_gpu.o
a - build/src/operator/tensor/elemwise_binary_op_extended_gpu.o
a - build/src/operator/tensor/elemwise_binary_op_logic_gpu.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o
a - build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o
a - build/src/operator/tensor/elemwise_sum_gpu.o
a - build/src/operator/tensor/elemwise_unary_op_gpu.o
a - build/src/operator/tensor/indexing_op_gpu.o
a - build/src/operator/tensor/init_op_gpu.o
a - build/src/operator/tensor/la_op_gpu.o
a - build/src/operator/tensor/matrix_op_gpu.o
a - build/src/operator/tensor/ordering_op_gpu.o
a - build/src/operator/tensor/sparse_retain_gpu.o
a - build/src/common/utils_gpu.o
a - build/src/ndarray/ndarray_function_gpu.o
a - build/src/operator/activation_gpu.o
a - build/src/operator/batch_norm_gpu.o
a - build/src/operator/batch_norm_v1_gpu.o
a - build/src/operator/bilinear_sampler_gpu.o
a - build/src/operator/concat_gpu.o
a - build/src/operator/convolution_gpu.o
a - build/src/operator/convolution_v1_gpu.o
a - build/src/operator/correlation_gpu.o
a - build/src/operator/crop_gpu.o
a - build/src/operator/cudnn_batch_norm_gpu.o
a - build/src/operator/deconvolution_gpu.o
a - build/src/operator/dropout_gpu.o
a - build/src/operator/fully_connected_gpu.o
a - build/src/operator/grid_generator_gpu.o
a - build/src/operator/identity_attach_KL_sparse_reg_gpu.o
a - build/src/operator/instance_norm_gpu.o
a - build/src/operator/l2_normalization_gpu.o
a - build/src/operator/leaky_relu_gpu.o
a - build/src/operator/loss_binary_op_gpu.o
a - build/src/operator/lrn_gpu.o
a - build/src/operator/make_loss_gpu.o
a - build/src/operator/optimizer_op_gpu.o
a - build/src/operator/pad_gpu.o
a - build/src/operator/pooling_gpu.o
a - build/src/operator/pooling_v1_gpu.o
a - build/src/operator/regression_output_gpu.o
a - build/src/operator/rnn_gpu.o
a - build/src/operator/roi_pooling_gpu.o
a - build/src/operator/sequence_last_gpu.o
a - build/src/operator/sequence_mask_gpu.o
a - build/src/operator/sequence_reverse_gpu.o
a - build/src/operator/slice_channel_gpu.o
a - build/src/operator/softmax_activation_gpu.o
a - build/src/operator/softmax_output_gpu.o
a - build/src/operator/spatial_transformer_gpu.o
a - build/src/operator/svm_output_gpu.o
a - build/src/operator/swapaxis_gpu.o
a - build/src/operator/upsampling_gpu.o
/Library/Developer/CommandLineTools/usr/bin/ranlib: file: lib/libmxnet.a(mkl_cppwrapper.o) has no symbols
/Library/Developer/CommandLineTools/usr/bin/ranlib: file: lib/libmxnet.a(mkl_memory.o) has no symbols
/Library/Developer/CommandLineTools/usr/bin/ranlib: file: lib/libmxnet.a(nnpack_util.o) has no symbols
/Library/Developer/CommandLineTools/usr/bin/ranlib: file: lib/libmxnet.a(mxrtc.o) has no symbols
g++ -DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/Users/sumner/Downloads/mxnet/mshadow/ -I/Users/sumner/Downloads/mxnet/dmlc-core/include -fPIC -I/Users/sumner/Downloads/mxnet/nnvm/include -I/Users/sumner/Downloads/mxnet/dlpack/include -Iinclude -funroll-loops -Wno-unused-variable -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_OPENCV=1 -I/usr/local/Cellar/opencv/3.3.0_3/include/opencv -I/usr/local/Cellar/opencv/3.3.0_3/include -DMSHADOW_USE_CUDNN=1 -I/usr/local/opt/openblas/include -I/Users/sumner/Downloads/mxnet/cub -DMXNET_USE_NVRTC=0 -shared -o lib/libmxnet.so build/src/operator/contrib/count_sketch.o build/src/operator/contrib/ctc_loss.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dequantize.o build/src/operator/contrib/fft.o build/src/operator/contrib/ifft.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/multibox_prior.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/proposal.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quantize.o build/src/operator/custom/custom.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/mkl/mkl_cppwrapper.o build/src/operator/mkl/mkl_memory.o build/src/operator/nn/softmax.o build/src/operator/nnpack/nnpack_util.o build/src/operator/random/multisample_op.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/sample_op.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/dot.o 
build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/elemwise_unary_op.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/la_op.o build/src/operator/tensor/matrix_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/square_sum.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_function.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_predict_api.o build/src/common/mxrtc.o build/src/common/utils.o build/src/engine/engine.o build/src/engine/naive_engine.o build/src/engine/profiler.o build/src/engine/threaded_engine.o build/src/engine/threaded_engine_perdevice.o build/src/engine/threaded_engine_pooled.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/executor/graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/inplace_addto_detect_pass.o build/src/io/image_aug_default.o build/src/io/image_det_aug_default.o build/src/io/image_io.o build/src/io/io.o build/src/io/iter_csv.o build/src/io/iter_image_det_recordio.o build/src/io/iter_image_recordio.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/io/iter_mnist.o build/src/kvstore/kvstore.o build/src/ndarray/autograd.o build/src/ndarray/ndarray.o 
build/src/ndarray/ndarray_function.o build/src/nnvm/legacy_json_util.o build/src/nnvm/legacy_op_util.o build/src/operator/activation.o build/src/operator/batch_norm.o build/src/operator/batch_norm_v1.o build/src/operator/bilinear_sampler.o build/src/operator/concat.o build/src/operator/convolution.o build/src/operator/convolution_v1.o build/src/operator/correlation.o build/src/operator/crop.o build/src/operator/cross_device_copy.o build/src/operator/cudnn_algoreg.o build/src/operator/cudnn_batch_norm.o build/src/operator/deconvolution.o build/src/operator/dropout.o build/src/operator/fully_connected.o build/src/operator/grid_generator.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/instance_norm.o build/src/operator/l2_normalization.o build/src/operator/leaky_relu.o build/src/operator/loss_binary_op.o build/src/operator/lrn.o build/src/operator/make_loss.o build/src/operator/operator.o build/src/operator/operator_util.o build/src/operator/optimizer_op.o build/src/operator/pad.o build/src/operator/pooling.o build/src/operator/pooling_v1.o build/src/operator/regression_output.o build/src/operator/rnn.o build/src/operator/roi_pooling.o build/src/operator/sequence_last.o build/src/operator/sequence_mask.o build/src/operator/sequence_reverse.o build/src/operator/slice_channel.o build/src/operator/softmax_activation.o build/src/operator/softmax_output.o build/src/operator/spatial_transformer.o build/src/operator/svm_output.o build/src/operator/swapaxis.o build/src/operator/upsampling.o build/src/storage/storage.o build/src/initialize.o build/src/resource.o /Users/sumner/Downloads/mxnet/dmlc-core/libdmlc.a build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/ctc_loss_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/dequantize_gpu.o build/src/operator/contrib/fft_gpu.o build/src/operator/contrib/ifft_gpu.o 
build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/quantize_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o build/src/operator/random/sample_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/dot_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/elemwise_unary_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/common/utils_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/activation_gpu.o build/src/operator/batch_norm_gpu.o build/src/operator/batch_norm_v1_gpu.o build/src/operator/bilinear_sampler_gpu.o build/src/operator/concat_gpu.o build/src/operator/convolution_gpu.o 
build/src/operator/convolution_v1_gpu.o build/src/operator/correlation_gpu.o build/src/operator/crop_gpu.o build/src/operator/cudnn_batch_norm_gpu.o build/src/operator/deconvolution_gpu.o build/src/operator/dropout_gpu.o build/src/operator/fully_connected_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/loss_binary_op_gpu.o build/src/operator/lrn_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/pad_gpu.o build/src/operator/pooling_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/rnn_gpu.o build/src/operator/roi_pooling_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/softmax_activation_gpu.o build/src/operator/softmax_output_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/upsampling_gpu.o -pthread -lm -lcudart -lcublas -lcurand -lcusolver -L/usr/local/cuda/lib64 -L/usr/local/cuda/lib -lopenblas -L/usr/local/Cellar/opencv/3.3.0_3/lib -lopencv_stitching -lopencv_superres -lopencv_videostab -lopencv_photo -lopencv_aruco -lopencv_bgsegm -lopencv_bioinspired -lopencv_ccalib -lopencv_dpm -lopencv_face -lopencv_fuzzy -lopencv_img_hash -lopencv_line_descriptor -lopencv_optflow -lopencv_reg -lopencv_rgbd -lopencv_saliency -lopencv_stereo -lopencv_structured_light -lopencv_phase_unwrapping -lopencv_surface_matching -lopencv_tracking -lopencv_datasets -lopencv_text -lopencv_dnn -lopencv_plot -lopencv_ml -lopencv_xfeatures2d -lopencv_shape -lopencv_video -lopencv_ximgproc -lopencv_calib3d -lopencv_features2d -lopencv_highgui -lopencv_videoio -lopencv_flann 
-lopencv_xobjdetect -lopencv_imgcodecs -lopencv_objdetect -lopencv_xphoto -lopencv_imgproc -lopencv_core -lcudnn -L/usr/local/opt/openblas/lib -L/usr/local/lib/graphviz/ -lcuda -lcufft \
-Wl,-all_load /Users/sumner/Downloads/mxnet/nnvm/lib/libnnvm.a -Wl,-noall_load
clang: warning: argument unused during compilation: '-pthread'
ld: warning: directory not found for option '-L/usr/local/cuda/lib64'
ld: warning: option -noall_load is obsolete and being ignored
g++ -DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/Users/sumner/Downloads/mxnet/mshadow/ -I/Users/sumner/Downloads/mxnet/dmlc-core/include -fPIC -I/Users/sumner/Downloads/mxnet/nnvm/include -I/Users/sumner/Downloads/mxnet/dlpack/include -Iinclude -funroll-loops -Wno-unused-variable -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_OPENCV=1 -I/usr/local/Cellar/opencv/3.3.0_3/include/opencv -I/usr/local/Cellar/opencv/3.3.0_3/include -DMSHADOW_USE_CUDNN=1 -I/usr/local/opt/openblas/include -I/Users/sumner/Downloads/mxnet/cub -DMXNET_USE_NVRTC=0 -std=c++11 -o bin/im2rec tools/im2rec.cc build/src/operator/contrib/count_sketch.o build/src/operator/contrib/ctc_loss.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dequantize.o build/src/operator/contrib/fft.o build/src/operator/contrib/ifft.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/multibox_prior.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/proposal.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quantize.o build/src/operator/custom/custom.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/mkl/mkl_cppwrapper.o build/src/operator/mkl/mkl_memory.o build/src/operator/nn/softmax.o build/src/operator/nnpack/nnpack_util.o build/src/operator/random/multisample_op.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/sample_op.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/dot.o 
build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/elemwise_unary_op.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/la_op.o build/src/operator/tensor/matrix_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/square_sum.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_function.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_predict_api.o build/src/common/mxrtc.o build/src/common/utils.o build/src/engine/engine.o build/src/engine/naive_engine.o build/src/engine/profiler.o build/src/engine/threaded_engine.o build/src/engine/threaded_engine_perdevice.o build/src/engine/threaded_engine_pooled.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/executor/graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/inplace_addto_detect_pass.o build/src/io/image_aug_default.o build/src/io/image_det_aug_default.o build/src/io/image_io.o build/src/io/io.o build/src/io/iter_csv.o build/src/io/iter_image_det_recordio.o build/src/io/iter_image_recordio.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/io/iter_mnist.o build/src/kvstore/kvstore.o build/src/ndarray/autograd.o build/src/ndarray/ndarray.o 
build/src/ndarray/ndarray_function.o build/src/nnvm/legacy_json_util.o build/src/nnvm/legacy_op_util.o build/src/operator/activation.o build/src/operator/batch_norm.o build/src/operator/batch_norm_v1.o build/src/operator/bilinear_sampler.o build/src/operator/concat.o build/src/operator/convolution.o build/src/operator/convolution_v1.o build/src/operator/correlation.o build/src/operator/crop.o build/src/operator/cross_device_copy.o build/src/operator/cudnn_algoreg.o build/src/operator/cudnn_batch_norm.o build/src/operator/deconvolution.o build/src/operator/dropout.o build/src/operator/fully_connected.o build/src/operator/grid_generator.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/instance_norm.o build/src/operator/l2_normalization.o build/src/operator/leaky_relu.o build/src/operator/loss_binary_op.o build/src/operator/lrn.o build/src/operator/make_loss.o build/src/operator/operator.o build/src/operator/operator_util.o build/src/operator/optimizer_op.o build/src/operator/pad.o build/src/operator/pooling.o build/src/operator/pooling_v1.o build/src/operator/regression_output.o build/src/operator/rnn.o build/src/operator/roi_pooling.o build/src/operator/sequence_last.o build/src/operator/sequence_mask.o build/src/operator/sequence_reverse.o build/src/operator/slice_channel.o build/src/operator/softmax_activation.o build/src/operator/softmax_output.o build/src/operator/spatial_transformer.o build/src/operator/svm_output.o build/src/operator/swapaxis.o build/src/operator/upsampling.o build/src/storage/storage.o build/src/initialize.o build/src/resource.o /Users/sumner/Downloads/mxnet/dmlc-core/libdmlc.a /Users/sumner/Downloads/mxnet/nnvm/lib/libnnvm.a build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/ctc_loss_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/dequantize_gpu.o build/src/operator/contrib/fft_gpu.o 
build/src/operator/contrib/ifft_gpu.o build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/quantize_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o build/src/operator/random/sample_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/dot_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/elemwise_unary_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/common/utils_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/activation_gpu.o build/src/operator/batch_norm_gpu.o build/src/operator/batch_norm_v1_gpu.o build/src/operator/bilinear_sampler_gpu.o build/src/operator/concat_gpu.o build/src/operator/convolution_gpu.o 
build/src/operator/convolution_v1_gpu.o build/src/operator/correlation_gpu.o build/src/operator/crop_gpu.o build/src/operator/cudnn_batch_norm_gpu.o build/src/operator/deconvolution_gpu.o build/src/operator/dropout_gpu.o build/src/operator/fully_connected_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/loss_binary_op_gpu.o build/src/operator/lrn_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/pad_gpu.o build/src/operator/pooling_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/rnn_gpu.o build/src/operator/roi_pooling_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/softmax_activation_gpu.o build/src/operator/softmax_output_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/upsampling_gpu.o -pthread -lm -lcudart -lcublas -lcurand -lcusolver -L/usr/local/cuda/lib64 -L/usr/local/cuda/lib -lopenblas -L/usr/local/Cellar/opencv/3.3.0_3/lib -lopencv_stitching -lopencv_superres -lopencv_videostab -lopencv_photo -lopencv_aruco -lopencv_bgsegm -lopencv_bioinspired -lopencv_ccalib -lopencv_dpm -lopencv_face -lopencv_fuzzy -lopencv_img_hash -lopencv_line_descriptor -lopencv_optflow -lopencv_reg -lopencv_rgbd -lopencv_saliency -lopencv_stereo -lopencv_structured_light -lopencv_phase_unwrapping -lopencv_surface_matching -lopencv_tracking -lopencv_datasets -lopencv_text -lopencv_dnn -lopencv_plot -lopencv_ml -lopencv_xfeatures2d -lopencv_shape -lopencv_video -lopencv_ximgproc -lopencv_calib3d -lopencv_features2d -lopencv_highgui -lopencv_videoio -lopencv_flann 
-lopencv_xobjdetect -lopencv_imgcodecs -lopencv_objdetect -lopencv_xphoto -lopencv_imgproc -lopencv_core -lcudnn -L/usr/local/opt/openblas/lib -L/usr/local/lib/graphviz/ -lcuda -lcufft
ld: warning: directory not found for option '-L/usr/local/cuda/lib64'`
It doesn't seem to contain any error message, and only warnings are found. For example, /usr/local/cuda/lib64
doesn't seem to exist or contain the cuda library. On OSX, I think it's in /usr/local/cuda/lib
instead.
Do you mind using other means of file sharing for the complete build log, after cleaning, from scratch?
Not at all. I appreciate your assistance. Where should I put the log?
Let's try https://gist.github.com/
Still no error in the gist :)
Let me try to reproduce your steps tomorrow to have a better idea of where the problem might be
Correct, there is no error in the gist. There is an error when I try to run anything with my GPU :(
python3
import mxnet as mx
a = mx.nd.ones((100, 100), mx.gpu())
which leads to
[10:09:29] src/c_api/c_api_ndarray.cc:147: GPU support is disabled. Compile MXNet with USE_CUDA=1 to enable GPU support.
[10:09:29] /Users/travis/build/dmlc/mxnet-distro/mxnet-build/dmlc-core/include/dmlc/logging.h:308: [10:09:29] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries:
[bt] (0) 0 libmxnet.so 0x000000010e4efad8 _ZN4dmlc15LogMessageFatalD2Ev + 40
[bt] (1) 1 libmxnet.so 0x000000010ebeebbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9_EEEESD_ + 2079
[bt] (2) 2 libmxnet.so 0x000000010ebef7f1 MXImperativeInvoke + 433
[bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x000000010d64542f ffi_call_unix64 + 79
[bt] (4) 4 ??? 0x00007fff52bac710 0x0 + 140734581360400
Traceback (most recent call last):
File "<stdin>", line 1, in <module>
File "/usr/local/lib/python3.6/site-packages/mxnet/ndarray.py", line 1216, in ones
return _internal._ones(shape=shape, ctx=ctx, dtype=dtype, **kwargs)
File "<string>", line 15, in _ones
File "/usr/local/lib/python3.6/site-packages/mxnet/_ctypes/ndarray.py", line 89, in _imperative_invoke
c_array(ctypes.c_char_p, [c_str(str(val)) for val in vals])))
File "/usr/local/lib/python3.6/site-packages/mxnet/base.py", line 129, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [10:09:29] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries:
[bt] (0) 0 libmxnet.so 0x000000010e4efad8 _ZN4dmlc15LogMessageFatalD2Ev + 40
[bt] (1) 1 libmxnet.so 0x000000010ebeebbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9_EEEESD_ + 2079
[bt] (2) 2 libmxnet.so 0x000000010ebef7f1 MXImperativeInvoke + 433
[bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x000000010d64542f ffi_call_unix64 + 79
[bt] (4) 4 ??? 0x00007fff52bac710 0x0 + 140734581360400
alright, thank you :)
I wasn't able to reproduce the problem. Could you paste your config.mk here?
#-------------------------------------------------------------------------------
# Template configuration for compiling mxnet
#
# If you want to change the configuration, please use the following
# steps. Assume you are on the root directory of mxnet. First copy the this
# file so that any local changes will be ignored by git
#
# $ cp make/config.mk .
#
# Next modify the according entries, and then compile by
#
# $ make
#
# or build in parallel with 8 threads
#
# $ make -j8
#-------------------------------------------------------------------------------
#---------------------
# choice of compiler
#--------------------
export CC = gcc
export CXX = g++
export NVCC = nvcc
# whether compile with options for MXNet developer
DEV = 0
# whether compile with debug
DEBUG = 0
# the additional link flags you want to add
ADD_LDFLAGS =
# the additional compile flags you want to add
ADD_CFLAGS =
#---------------------------------------------
# matrix computation libraries for CPU/GPU
#---------------------------------------------
# whether use CUDA during compile
USE_CUDA = 0
# add the path to CUDA library to link and compile flag
# if you have already add them to environment variable, leave it as NONE
# USE_CUDA_PATH = /usr/local/cuda
USE_CUDA_PATH = NONE
# whether use CUDNN R3 library
USE_CUDNN = 0
# whether use cuda runtime compiling for writing kernels in native language (i.e. Python)
USE_NVRTC = 0
# whether use opencv during compilation
# you can disable it, however, you will not able to use
# imbin iterator
USE_OPENCV = 1
# use openmp for parallelization
USE_OPENMP = 0
# choose the version of blas you want to use
# can be: mkl, blas, atlas, openblas
USE_BLAS = apple
# whether use lapack during compilation
# only effective when compiled with blas versions openblas/apple/atlas/mkl
USE_LAPACK = 1
# add path to intel library, you may need it for MKL, if you did not add the path
# to environment variable
USE_INTEL_PATH = NONE
#----------------------------
# distributed computing
#----------------------------
# whether or not to enable multi-machine supporting
USE_DIST_KVSTORE = 0
# whether or not allow to read and write HDFS directly. If yes, then hadoop is
# required
USE_HDFS = 0
# path to libjvm.so. required if USE_HDFS=1
LIBJVM=$(JAVA_HOME)/jre/lib/amd64/server
# whether or not allow to read and write AWS S3 directly. If yes, then
# libcurl4-openssl-dev is required, it can be installed on Ubuntu by
# sudo apt-get install -y libcurl4-openssl-dev
USE_S3 = 0
#----------------------------
# additional operators
#----------------------------
# path to folders containing projects specific operators that you don't want to put in src/operators
EXTRA_OPERATORS =
#----------------------------
# other features
#----------------------------
# Create C++ interface package
USE_CPP_PACKAGE = 0
#----------------------------
# plugins
#----------------------------
# whether to use torch integration. This requires installing torch.
# TORCH_PATH = $(HOME)/torch
# MXNET_PLUGINS += plugin/torch/torch.mk
USE_BLAS = openblas
ADD_CFLAGS += -I/usr/local/opt/openblas/include
ADD_LDFLAGS += -L/usr/local/opt/openblas/lib
ADD_LDFLAGS += -L/usr/local/lib/graphviz/
USE_CUDA = 1
USE_CUDA_PATH = /usr/local/cuda
USE_CUDNN = 1
And just to be thorough, could you run the env
command in your shell and share the output here? Be sure to remove anything that may be sensitive from the output before pasting.
Sure
TERM_PROGRAM=Apple_Terminal
TERM=xterm-256color
SHELL=/bin/bash
TERM_PROGRAM_VERSION=388.1.1
CUDA_HOME=/usr/local/cuda
USER=sumner
PATH=/usr/local/bin:/usr/local/sbin:/usr/local/cuda/bin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin:/Applications/Postgres.app/Contents/Versions/latest/bin:/Users/sumner/Library/Python/3.6/bin:/Users/sumner/Library/Python/3.6/lib/python/site-packages:/usr/local/sbin:/usr/local/Cellar:/Applications/Postgres.app/Contents/Versions/latest/bin
LANG=en_US.UTF-8
HOME=/Users/sumner
SHLVL=1
DYLD_LIBRARY_PATH=/usr/local/cuda/lib:
_=/usr/bin/env
also, I want to reiterate that I would appreciate it if you could implement a gpu connection test
either of the following would be fine by me:
A specific error for not being able to reach the GPU
gpu_device = mxnet.gpu()
try:
nd.ones(shape=(3,3), ctx=gpu_device)
except MXNetGPUError as err:
print("Can not connect to GPU {err}".formate(err=err))
or return -1
gpu_device = mxnet.gpu()
if not gpu_device:
print("GPU is not available")
But the main issue is that it seems that your GPU command examples might not be correct, given that the errors are raised by the operation nd.ones with
Operator _ones is not implemented for GPU.
because when trying something else
x = nd.ones(shape=(3,3))
x_gpu = x.copyto(gpu(0))
print(x_gpu)
I get
---------------------------------------------------------------------------
MXNetError Traceback (most recent call last)
<ipython-input-10-6b8971f19695> in <module>()
1 x = nd.ones(shape=(3,3))
----> 2 x_gpu = x.copyto(gpu(0))
3 print(x_gpu)
/usr/local/lib/python3.6/site-packages/mxnet/ndarray.py in copyto(self, other)
990 elif isinstance(other, Context):
991 hret = NDArray(_new_alloc_handle(self.shape, other, True, self.dtype))
--> 992 return _internal._copyto(self, out=hret)
993 else:
994 raise TypeError('copyto does not support type ' + str(type(other)))
/usr/local/lib/python3.6/site-packages/mxnet/ndarray.py in _copyto(src, out, name, **kwargs)
/usr/local/lib/python3.6/site-packages/mxnet/_ctypes/ndarray.py in _imperative_invoke(handle, ndargs, keys, vals, out)
87 ctypes.c_int(len(keys)),
88 c_array(ctypes.c_char_p, [c_str(key) for key in keys]),
---> 89 c_array(ctypes.c_char_p, [c_str(str(val)) for val in vals])))
90
91 if original_output is not None:
/usr/local/lib/python3.6/site-packages/mxnet/base.py in check_call(ret)
127 """
128 if ret != 0:
--> 129 raise MXNetError(py_str(_LIB.MXGetLastError()))
130
131 if sys.version_info[0] < 3:
MXNetError: [12:57:26] src/ndarray/ndarray.cc:402: GPU is not enabled
Stack trace returned 7 entries:
[bt] (0) 0 libmxnet.so 0x00000001054c6ad8 _ZN4dmlc15LogMessageFatalD2Ev + 40
[bt] (1) 1 libmxnet.so 0x0000000105cae933 _ZN5mxnet10CopyFromToERKNS_7NDArrayEPS0_i + 1587
[bt] (2) 2 libmxnet.so 0x0000000105d15513 _ZNSt3__110__function6__funcIZN5mxnet2op20RegisterLegacyNDFuncEvE3$_4NS_9allocatorIS4_EEFvRKN4nnvm9NodeAttrsERKNS_6vectorINS2_7NDArrayENS5_ISC_EEEEPSE_EEclESA_SG_OSH_ + 1619
[bt] (3) 3 libmxnet.so 0x0000000105bc5611 _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9_EEEESD_ + 625
[bt] (4) 4 libmxnet.so 0x0000000105bc67f1 MXImperativeInvoke + 433
[bt] (5) 5 _ctypes.cpython-36m-darwin.so 0x00000001040b442f ffi_call_unix64 + 79
[bt] (6) 6 ??? 0x00007fff5d7393e0 0x0 + 140734761243616
Which is more consistent with GPU not being enabled, although I am pretty sure that it is...
Anyway if it helps you debug what is going on to help me:
I am using:
And if you are concerned that maybe this set up is somehow interfering with the GPU I can assure you it is not. I can use GPU accelerated code in other languages :)
I somehow truly think it is the reversion to a previous command line tools to appease nvcc.
Looking at ArrayFire, they are all equally confused: https://github.com/arrayfire/arrayfire/issues/1384
:)
You seem to have two copies of python in your system, one in /usr/local/lib/python3.6/
and the other in /Users/sumner/Library/Python/3.6/
. The error you see says the mxnet you're using is not compiled with USE_CUDA=1
while you obviously did based on the config.mk you sent. I tested locally that USE_CUDA=1
works, and it's shown in your build log too.
To sum up, are you sure you're verifying the right copy of mxnet?
Good catch. Dumb question: how do I take the master mxnet installed above and replace the other mxnet...
setting your path to use the right copy of python should do. PATH setting should be in your .bashrc/.zshrc
/usr/local/lib/python3.6/ contains mxnet inside; /Users/sumner/Library/Python/3.6/ does not.
The original link doesn't show what to do after make, and since there isn't an __init__.py I can't just import from inside the directory.
Trying to import ndarray to do the test from the python subdir in the local mxnet results in an error from ctypes...
after running python3 setup.py develop --user things seem to work
I wanted to install MXNet on a second machine (running Ubuntu 16.04 LTS). The vanilla install worked fine (no GPU enabled). Trying to install with GPU enabled results in
-Wl,--whole-archive /home/sumner/mxnet/nnvm/lib/libnnvm.a -Wl,--no-whole-archive
/usr/bin/ld: cannot find -lopenblas
collect2: error: ld returned 1 exit status
Makefile:384: recipe for target 'lib/libmxnet.so' failed
make: *** [lib/libmxnet.so] Error 1
We have pre-built binary for ubuntu. Depending on the cuda version, you may choose from:
mxnet-cu75
, mxnet-cu80
, or mxnet-cu90
.
You can then use pip install --pre package_name
to install the package.
python3
Python 3.5.2 (default, Sep 14 2017, 22:51:06)
[GCC 5.4.0 20160609] on linux
Type "help", "copyright", "credits" or "license" for more information.
>>> import mxnet as mx
Traceback (most recent call last):
File "<stdin>", line 1, in <module>
File "/home/sumner/mxnet/python/mxnet/__init__.py", line 25, in <module>
from .base import MXNetError
File "/home/sumner/mxnet/python/mxnet/base.py", line 111, in <module>
_LIB = _load_lib()
File "/home/sumner/mxnet/python/mxnet/base.py", line 102, in _load_lib
lib_path = libinfo.find_lib_path()
File "/home/sumner/mxnet/python/mxnet/libinfo.py", line 59, in find_lib_path
'List of candidates:\n' + str('\n'.join(dll_path)))
RuntimeError: Cannot find the files.
List of candidates:
/home/sumner/mxnet/python/mxnet/libmxnet.so
/home/sumner/mxnet/python/mxnet/../../lib/libmxnet.so
/home/sumner/mxnet/python/mxnet/../../build/Release/libmxnet.so
../../../libmxnet.so
>>>
?
output of trying to import mxnet following pip of the cuda enabled mxnet
@szha this error is still persistent for pip3 install --pre mxnet-cu90
Sorry for missing on this. From the error it looks like your python is trying to load from /home/sumner/mxnet/
, which doesn't look like the site-packages that pip usually would install in. Could it be that you have symbolic link from your work space to your python's path? (e.g. result of pip install -e
or python setup.py develop
)
I don't think so. How would I check for this?
If I remove the directory, mxnet loads, but then it says things like
import mxnet as mx
from mxnet import nd, gluon
ImportError: cannot import name 'nd'
Does it show any other error, such as "libxxx not found"?
it did, but I just went and removed all mxnet files and reinstalled via pip. Seems to work now. Sorry :)
Please complete the Python GPU-enabled install guide for MacOS. This guide is incomplete / following it to completion results in errors. https://mxnet.incubator.apache.org/get_started/osx_setup.html
Also, please update mx.gpu() to return -1 if no gpu detected. Right now I run mx.gpu() and it returns 0, which means it should be connected to my first gpu (a functioning external NVIDIA GeForce TITAN X), but trying to run anything with this command (e.g. in the demo
mx.nd.ones((100,100),mx.gpu())
results in errors.
Environment info
Operating System: MacOS 10.12.6
Package used (Python/R/Scala/Julia): Python MXNet version: 0.11
MXNet commit hash (
git rev-parse HEAD
): a5edbf94094581ee27157eae4f2113115a3994e7
Python version and distribution: 3.6
Error Message:
Please paste the full error message, including stack trace.
`>>> b = mx.nd.ones((100,100), gpu_device) [14:16:34] src/c_api/c_api_ndarray.cc:147: GPU support is disabled. Compile MXNet with USE_CUDA=1 to enable GPU support. [14:16:34] /Users/travis/build/dmlc/mxnet-distro/mxnet-build/dmlc-core/include/dmlc/logging.h:308: [14:16:34] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries: [bt] (0) 0 libmxnet.so 0x0000000104be1ad8 _ZN4dmlc15LogMessageFatalD2Ev + 40 [bt] (1) 1 libmxnet.so 0x00000001052e0bbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9EEEESD + 2079 [bt] (2) 2 libmxnet.so 0x00000001052e17f1 MXImperativeInvoke + 433 [bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x0000000103d3742f ffi_call_unix64 + 79 [bt] (4) 4 ??? 0x00007fff5c4ba950 0x0 + 140734741850448
Traceback (most recent call last): File "", line 1, in
File "/usr/local/lib/python3.6/site-packages/mxnet/ndarray.py", line 1216, in ones
return _internal._ones(shape=shape, ctx=ctx, dtype=dtype, **kwargs)
File "", line 15, in _ones
File "/usr/local/lib/python3.6/site-packages/mxnet/_ctypes/ndarray.py", line 89, in _imperative_invoke
c_array(ctypes.c_char_p, [c_str(str(val)) for val in vals])))
File "/usr/local/lib/python3.6/site-packages/mxnet/base.py", line 129, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [14:16:34] src/c_api/c_api_ndarray.cc:416: Operator _ones is not implemented for GPU.
Stack trace returned 5 entries: [bt] (0) 0 libmxnet.so 0x0000000104be1ad8 _ZN4dmlc15LogMessageFatalD2Ev + 40 [bt] (1) 1 libmxnet.so 0x00000001052e0bbf _Z20ImperativeInvokeImplRKN5mxnet7ContextERKN4nnvm9NodeAttrsEPNSt3__16vectorINS_7NDArrayENS7_9allocatorIS9EEEESD + 2079 [bt] (2) 2 libmxnet.so 0x00000001052e17f1 MXImperativeInvoke + 433 [bt] (3) 3 _ctypes.cpython-36m-darwin.so 0x0000000103d3742f ffi_call_unix64 + 79 [bt] (4) 4 ??? `
Minimum reproducible example
if you are using your own code, please provide a short script that reproduces the error.
gpu_device = mx.gpu() b = mx.nd.ones((100,100), gpu_device)
Steps to reproduce
or if you are running standard examples, please provide the commands you have run that lead to the error.
1. 2. 3.
What have you tried to solve it?