Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/broadcast_reduce_op_index.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o src/operator/tensor/elemwise_binary_broadcast_op_logic.cu >build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/elemwise_scatter_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/elemwise_scatter_op.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/indexing_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/indexing_op.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/elemwise_binary_broadcast_op_logic.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/tensor/la_op_gpu.o src/operator/tensor/la_op.cu >build/src/operator/tensor/la_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/la_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/la_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/tensor/elemwise_binary_op_logic_gpu.o src/operator/tensor/elemwise_binary_op_logic.cu >build/src/operator/tensor/elemwise_binary_op_logic_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/tensor/elemwise_unary_op_basic_gpu.o src/operator/tensor/elemwise_unary_op_basic.cu >build/src/operator/tensor/elemwise_unary_op_basic_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/elemwise_binary_op_logic.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/tensor/sparse_retain_gpu.o src/operator/tensor/sparse_retain.cu >build/src/operator/tensor/sparse_retain_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/elemwise_unary_op_basic_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/elemwise_unary_op_basic.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/tensor/sparse_retain_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/tensor/sparse_retain.cu
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/optimizer_op_gpu.o src/operator/contrib/optimizer_op.cu >build/src/operator/contrib/optimizer_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/optimizer_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/optimizer_op.cu
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/boolean_mask_gpu.o src/operator/contrib/boolean_mask.cu >build/src/operator/contrib/boolean_mask_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/boolean_mask_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/boolean_mask.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/adaptive_avg_pooling_gpu.o src/operator/contrib/adaptive_avg_pooling.cu >build/src/operator/contrib/adaptive_avg_pooling_gpu.d
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/adaptive_avg_pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/adaptive_avg_pooling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/ifft_gpu.o src/operator/contrib/ifft.cu >build/src/operator/contrib/ifft_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/multibox_detection_gpu.o src/operator/contrib/multibox_detection.cu >build/src/operator/contrib/multibox_detection_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/ifft_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/ifft.cu
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/multibox_detection_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/multibox_detection.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/index_copy_gpu.o src/operator/contrib/index_copy.cu >build/src/operator/contrib/index_copy_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/tensorrt_gpu.o src/operator/contrib/tensorrt.cu >build/src/operator/contrib/tensorrt_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/tensorrt_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/tensorrt.cu
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/multibox_target_gpu.o src/operator/contrib/multibox_target.cu >build/src/operator/contrib/multibox_target_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/index_copy_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/index_copy.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/multibox_target_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/multibox_target.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/proposal_gpu.o src/operator/contrib/proposal.cu >build/src/operator/contrib/proposal_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/bilinear_resize_gpu.o src/operator/contrib/bilinear_resize.cu >build/src/operator/contrib/bilinear_resize_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/proposal_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/proposal.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/bilinear_resize_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/bilinear_resize.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/count_sketch_gpu.o src/operator/contrib/count_sketch.cu >build/src/operator/contrib/count_sketch_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/count_sketch_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/count_sketch.cu
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/dgl_graph_gpu.o src/operator/contrib/dgl_graph.cu >build/src/operator/contrib/dgl_graph_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/gradient_multiplier_op_gpu.o src/operator/contrib/gradient_multiplier_op.cu >build/src/operator/contrib/gradient_multiplier_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/dgl_graph_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/dgl_graph.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/gradient_multiplier_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/gradient_multiplier_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/bounding_box_gpu.o src/operator/contrib/bounding_box.cu >build/src/operator/contrib/bounding_box_gpu.d
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: calling a constexpr __host__ function("quiet_NaN") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(81): warning: calling a constexpr __host__ function("infinity") from a __host__ __device__ function("Map") is not allowed. The experimental flag '--expt-relaxed-constexpr' can be used to allow this.
- detected during:
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=float]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<float *, float *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int8_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int8_t *, int8_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int32_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int32_t *, int32_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- src/operator/tensor/./.././contrib/erfinv-inl.h(79): warning: floating-point value does not fit in required integral type
- detected during:
- instantiation of "DType mxnet::op::mshadow_op::erfinv::Map(DType) [with DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(479): here
- instantiation of "void mxnet::op::mxnet_op::op_with_req<OP, req>::Map(mxnet::index_t, DType *, const DType *) [with OP=mxnet::op::mshadow_op::erfinv, req=1, DType=int64_t]"
- src/operator/tensor/./../mxnet_op.h(701): here
- instantiation of "void mxnet::op::mxnet_op::mxnet_generic_kernel<OP,Args...>(int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./../mxnet_op.h(721): here
- instantiation of "void mxnet::op::mxnet_op::Kernel<OP, mxnet::gpu>::Launch(mshadow::Stream<mshadow::gpu> *, int, Args...) [with OP=mxnet::op::mxnet_op::op_with_req<mxnet::op::mshadow_op::erfinv, 1>, Args=<int64_t *, int64_t *>]"
- src/operator/tensor/./elemwise_unary_op.h(243): here
- instantiation of "void mxnet::op::UnaryOp::Compute<xpu,OP>(const nnvm::NodeAttrs &, const mxnet::OpContext &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &, const std::vector<mxnet::OpReqType, std::allocator<mxnet::OpReqType>> &, const std::vector<mxnet::TBlob, std::allocator<mxnet::TBlob>> &) [with xpu=mxnet::gpu, OP=mxnet::op::mshadow_op::erfinv]"
- src/operator/tensor/elemwise_unary_op_basic.cu(67): here
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/bounding_box_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/bounding_box.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/fft_gpu.o src/operator/contrib/fft.cu >build/src/operator/contrib/fft_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/multibox_prior_gpu.o src/operator/contrib/multibox_prior.cu >build/src/operator/contrib/multibox_prior_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/fft_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/fft.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/multibox_prior_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/multibox_prior.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/deformable_psroi_pooling_gpu.o src/operator/contrib/deformable_psroi_pooling.cu >build/src/operator/contrib/deformable_psroi_pooling_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/deformable_psroi_pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/deformable_psroi_pooling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/quadratic_op_gpu.o src/operator/contrib/quadratic_op.cu >build/src/operator/contrib/quadratic_op_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/transformer_gpu.o src/operator/contrib/transformer.cu >build/src/operator/contrib/transformer_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/transformer_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/transformer.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/quadratic_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/quadratic_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/multi_proposal_gpu.o src/operator/contrib/multi_proposal.cu >build/src/operator/contrib/multi_proposal_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/multi_proposal_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/multi_proposal.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/adamw_gpu.o src/operator/contrib/adamw.cu >build/src/operator/contrib/adamw_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/sync_batch_norm_gpu.o src/operator/contrib/sync_batch_norm.cu >build/src/operator/contrib/sync_batch_norm_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/adamw_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/adamw.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/sync_batch_norm_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/sync_batch_norm.cu
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h: In function ‘void mxnet::op::SliceLikeInferRanges(const TShape&, const TShape&, const TShape&, nnvm::Tuple<dmlc::optional<int> >*, nnvm::Tuple<dmlc::optional<int> >*, nnvm::Tuple<dmlc::optional<int> >*)’:
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +20)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- new (&val) T(other.value());
- ^
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +28)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +36)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +20)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- new (&val) T(other.value());
- ^
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +28)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +36)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +20)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- new (&val) T(other.value());
- ^
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +28)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /home/mahmood/mx/mxnet/3rdparty/dmlc-core/include/dmlc/././optional.h:56:1: warning: ‘*((void*)&<anonymous> +36)’ may be used uninitialized in this function [-Wmaybe-uninitialized]
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/psroi_pooling_gpu.o src/operator/contrib/psroi_pooling.cu >build/src/operator/contrib/psroi_pooling_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/deformable_convolution_gpu.o src/operator/contrib/deformable_convolution.cu >build/src/operator/contrib/deformable_convolution_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/psroi_pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/psroi_pooling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/contrib/roi_align_gpu.o src/operator/contrib/roi_align.cu >build/src/operator/contrib/roi_align_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/deformable_convolution_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/deformable_convolution.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/contrib/roi_align_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/contrib/roi_align.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/random/shuffle_op_gpu.o src/operator/random/shuffle_op.cu >build/src/operator/random/shuffle_op_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/random/sample_multinomial_op_gpu.o src/operator/random/sample_multinomial_op.cu >build/src/operator/random/sample_multinomial_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/random/shuffle_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/random/shuffle_op.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/random/sample_multinomial_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/random/sample_multinomial_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/random/multisample_op_gpu.o src/operator/random/multisample_op.cu >build/src/operator/random/multisample_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/random/multisample_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/random/multisample_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/random/sample_op_gpu.o src/operator/random/sample_op.cu >build/src/operator/random/sample_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/random/sample_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/random/sample_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/requantize_gpu.o src/operator/quantization/requantize.cu >build/src/operator/quantization/requantize_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantize_gpu.o src/operator/quantization/quantize.cu >build/src/operator/quantization/quantize_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantize_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantize.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/requantize_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/requantize.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/dequantize_gpu.o src/operator/quantization/dequantize.cu >build/src/operator/quantization/dequantize_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantized_conv_gpu.o src/operator/quantization/quantized_conv.cu >build/src/operator/quantization/quantized_conv_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/dequantize_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/dequantize.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantized_conv_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantized_conv.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantized_flatten_gpu.o src/operator/quantization/quantized_flatten.cu >build/src/operator/quantization/quantized_flatten_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantized_fully_connected_gpu.o src/operator/quantization/quantized_fully_connected.cu >build/src/operator/quantization/quantized_fully_connected_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantized_flatten_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantized_flatten.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantized_fully_connected_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantized_fully_connected.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantized_pooling_gpu.o src/operator/quantization/quantized_pooling.cu >build/src/operator/quantization/quantized_pooling_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantized_pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantized_pooling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/quantization/quantize_v2_gpu.o src/operator/quantization/quantize_v2.cu >build/src/operator/quantization/quantize_v2_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/quantization/quantize_v2_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/quantization/quantize_v2.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/custom/native_op_gpu.o src/operator/custom/native_op.cu >build/src/operator/custom/native_op_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/image/resize_gpu.o src/operator/image/resize.cu >build/src/operator/image/resize_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/custom/native_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/custom/native_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/image/image_random_gpu.o src/operator/image/image_random.cu >build/src/operator/image/image_random_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/image/resize_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/image/resize.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/lrn_gpu.o src/operator/nn/lrn.cu >build/src/operator/nn/lrn_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/image/image_random_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/image/image_random.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/lrn_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/lrn.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/dropout_gpu.o src/operator/nn/dropout.cu >build/src/operator/nn/dropout_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/softmax_activation_gpu.o src/operator/nn/softmax_activation.cu >build/src/operator/nn/softmax_activation_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/dropout_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/dropout.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/softmax_activation_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/softmax_activation.cu
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/fully_connected_gpu.o src/operator/nn/fully_connected.cu >build/src/operator/nn/fully_connected_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/fully_connected_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/fully_connected.cu
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/deconvolution_gpu.o src/operator/nn/deconvolution.cu >build/src/operator/nn/deconvolution_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/pooling_gpu.o src/operator/nn/pooling.cu >build/src/operator/nn/pooling_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/deconvolution_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/deconvolution.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/softmax_gpu.o src/operator/nn/softmax.cu >build/src/operator/nn/softmax_gpu.d
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/pooling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/activation_gpu.o src/operator/nn/activation.cu >build/src/operator/nn/activation_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/softmax_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/softmax.cu
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/ctc_loss_gpu.o src/operator/nn/ctc_loss.cu >build/src/operator/nn/ctc_loss_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/activation_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/activation.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/ctc_loss_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/ctc_loss.cu
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/convolution_gpu.o src/operator/nn/convolution.cu >build/src/operator/nn/convolution_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/upsampling_gpu.o src/operator/nn/upsampling.cu >build/src/operator/nn/upsampling_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/convolution_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/convolution.cu
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- src/operator/nn/./dropout-inl.h(498): warning: statement is unreachable
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/upsampling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/upsampling.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/batch_norm_gpu.o src/operator/nn/batch_norm.cu >build/src/operator/nn/batch_norm_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/batch_norm_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/batch_norm.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/layer_norm_gpu.o src/operator/nn/layer_norm.cu >build/src/operator/nn/layer_norm_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/layer_norm_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/layer_norm.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/nn/concat_gpu.o src/operator/nn/concat.cu >build/src/operator/nn/concat_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/nn/concat_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/nn/concat.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/common/utils_gpu.o src/common/utils.cu >build/src/common/utils_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/common/utils_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/common/utils.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/common/random_generator_gpu.o src/common/random_generator.cu >build/src/common/random_generator_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/common/random_generator_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/common/random_generator.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/ndarray/ndarray_function_gpu.o src/ndarray/ndarray_function.cu >build/src/ndarray/ndarray_function_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/ndarray/ndarray_function_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/ndarray/ndarray_function.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/svm_output_gpu.o src/operator/svm_output.cu >build/src/operator/svm_output_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/optimizer_op_gpu.o src/operator/optimizer_op.cu >build/src/operator/optimizer_op_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/spatial_transformer_gpu.o src/operator/spatial_transformer.cu >build/src/operator/spatial_transformer_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/svm_output_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/svm_output.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/optimizer_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/optimizer_op.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/spatial_transformer_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/spatial_transformer.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/make_loss_gpu.o src/operator/make_loss.cu >build/src/operator/make_loss_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/make_loss_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/make_loss.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/pooling_v1_gpu.o src/operator/pooling_v1.cu >build/src/operator/pooling_v1_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/pooling_v1_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/pooling_v1.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/instance_norm_gpu.o src/operator/instance_norm.cu >build/src/operator/instance_norm_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/sequence_mask_gpu.o src/operator/sequence_mask.cu >build/src/operator/sequence_mask_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/correlation_gpu.o src/operator/correlation.cu >build/src/operator/correlation_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/instance_norm_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/instance_norm.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/sequence_mask_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/sequence_mask.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/correlation_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/correlation.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/slice_channel_gpu.o src/operator/slice_channel.cu >build/src/operator/slice_channel_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/rnn_gpu.o src/operator/rnn.cu >build/src/operator/rnn_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/crop_gpu.o src/operator/crop.cu >build/src/operator/crop_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/slice_channel_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/slice_channel.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/rnn_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/rnn.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/crop_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/crop.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/convolution_v1_gpu.o src/operator/convolution_v1.cu >build/src/operator/convolution_v1_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/sequence_reverse_gpu.o src/operator/sequence_reverse.cu >build/src/operator/sequence_reverse_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/convolution_v1_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/convolution_v1.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/sequence_reverse_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/sequence_reverse.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/identity_attach_KL_sparse_reg_gpu.o src/operator/identity_attach_KL_sparse_reg.cu >build/src/operator/identity_attach_KL_sparse_reg_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/leaky_relu_gpu.o src/operator/leaky_relu.cu >build/src/operator/leaky_relu_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/swapaxis_gpu.o src/operator/swapaxis.cu >build/src/operator/swapaxis_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/identity_attach_KL_sparse_reg_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/identity_attach_KL_sparse_reg.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/leaky_relu_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/leaky_relu.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/swapaxis_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/swapaxis.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/grid_generator_gpu.o src/operator/grid_generator.cu >build/src/operator/grid_generator_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/pad_gpu.o src/operator/pad.cu >build/src/operator/pad_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/grid_generator_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/grid_generator.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/bilinear_sampler_gpu.o src/operator/bilinear_sampler.cu >build/src/operator/bilinear_sampler_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/roi_pooling_gpu.o src/operator/roi_pooling.cu >build/src/operator/roi_pooling_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/pad_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/pad.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/bilinear_sampler_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/bilinear_sampler.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/batch_norm_v1_gpu.o src/operator/batch_norm_v1.cu >build/src/operator/batch_norm_v1_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/roi_pooling_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/roi_pooling.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/batch_norm_v1_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/batch_norm_v1.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/loss_binary_op_gpu.o src/operator/loss_binary_op.cu >build/src/operator/loss_binary_op_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/loss_binary_op_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/loss_binary_op.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/regression_output_gpu.o src/operator/regression_output.cu >build/src/operator/regression_output_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/l2_normalization_gpu.o src/operator/l2_normalization.cu >build/src/operator/l2_normalization_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/regression_output_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/regression_output.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/l2_normalization_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/l2_normalization.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/sequence_last_gpu.o src/operator/sequence_last.cu >build/src/operator/sequence_last_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/operator/softmax_output_gpu.o src/operator/softmax_output.cu >build/src/operator/softmax_output_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/sequence_last_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/sequence_last.cu
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/kvstore/gradient_compression_gpu.o src/kvstore/gradient_compression.cu >build/src/kvstore/gradient_compression_gpu.d
- /usr/local/cuda/bin/nvcc -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" --generate-dependencies -MT build/src/kvstore/kvstore_utils_gpu.o src/kvstore/kvstore_utils.cu >build/src/kvstore/kvstore_utils_gpu.d
- /usr/local/cuda/bin/nvcc -c -o build/src/operator/softmax_output_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/operator/softmax_output.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/kvstore/gradient_compression_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/kvstore/gradient_compression.cu
- /usr/local/cuda/bin/nvcc -c -o build/src/kvstore/kvstore_utils_gpu.o -std=c++11 -Xcompiler -D_FORCE_INLINES -O3 -ccbin g++ -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=[sm_75,compute_75] --fatbin-options -compress-all -Xcompiler "-DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0" src/kvstore/kvstore_utils.cu
- ar crv lib/libmxnet.a build/src/operator/quantization/mkldnn/mkldnn_quantized_conv.o build/src/operator/quantization/mkldnn/mkldnn_quantized_pooling.o build/src/operator/quantization/mkldnn/mkldnn_quantized_concat.o build/src/operator/subgraph/mkldnn/mkldnn_conv_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv_post_quantize_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv.o build/src/operator/nn/mkldnn/mkldnn_convolution.o build/src/operator/nn/mkldnn/mkldnn_concat.o build/src/operator/nn/mkldnn/mkldnn_base.o build/src/operator/nn/mkldnn/mkldnn_slice.o build/src/operator/nn/mkldnn/mkldnn_act.o build/src/operator/nn/mkldnn/mkldnn_softmax.o build/src/operator/nn/mkldnn/mkldnn_deconvolution.o build/src/operator/nn/mkldnn/mkldnn_copy.o build/src/operator/nn/mkldnn/mkldnn_softmax_output.o build/src/operator/nn/mkldnn/mkldnn_fully_connected.o build/src/operator/nn/mkldnn/mkldnn_pooling.o build/src/operator/nn/mkldnn/mkldnn_sum.o build/src/operator/nn/cudnn/cudnn_algoreg.o build/src/operator/nn/cudnn/cudnn_batch_norm.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/square_sum.o build/src/operator/tensor/matrix_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/la_op.o build/src/operator/tensor/histogram.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/dot.o build/src/operator/tensor/elemwise_scatter_op.o build/src/operator/tensor/elemwise_unary_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/ravel.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o 
build/src/operator/tensor/diag_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/elemwise_binary_op.o build/src/operator/tensor/elemwise_unary_op_trig.o build/src/operator/contrib/tensorrt.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/sync_batch_norm.o build/src/operator/contrib/count_sketch.o build/src/operator/contrib/roi_align.o build/src/operator/contrib/bilinear_resize.o build/src/operator/contrib/nnz.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/nnvm_to_onnx.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dgl_graph.o build/src/operator/contrib/fft.o build/src/operator/contrib/multibox_prior.o build/src/operator/contrib/gradient_multiplier_op.o build/src/operator/contrib/adamw.o build/src/operator/contrib/transformer.o build/src/operator/contrib/krprod.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/index_copy.o build/src/operator/contrib/optimizer_op.o build/src/operator/contrib/bounding_box.o build/src/operator/contrib/proposal.o build/src/operator/contrib/boolean_mask.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quadratic_op.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/ifft.o build/src/operator/contrib/adaptive_avg_pooling.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/multisample_op.o build/src/operator/random/unique_sample_op.o build/src/operator/random/sample_op.o build/src/operator/random/shuffle_op.o build/src/operator/quantization/requantize.o build/src/operator/quantization/dequantize.o build/src/operator/quantization/quantize_graph_pass.o 
build/src/operator/quantization/quantized_flatten.o build/src/operator/quantization/quantized_conv.o build/src/operator/quantization/quantized_fully_connected.o build/src/operator/quantization/quantized_pooling.o build/src/operator/quantization/quantize_v2.o build/src/operator/quantization/quantized_concat.o build/src/operator/quantization/quantize.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/custom/custom.o build/src/operator/subgraph/partition_graph.o build/src/operator/subgraph/default_subgraph_property.o build/src/operator/nnpack/nnpack_util.o build/src/operator/image/image_random.o build/src/operator/image/resize.o build/src/operator/nn/softmax.o build/src/operator/nn/pooling.o build/src/operator/nn/deconvolution.o build/src/operator/nn/activation.o build/src/operator/nn/upsampling.o build/src/operator/nn/batch_norm.o build/src/operator/nn/ctc_loss.o build/src/operator/nn/fully_connected.o build/src/operator/nn/convolution.o build/src/operator/nn/layer_norm.o build/src/operator/nn/concat.o build/src/operator/nn/softmax_activation.o build/src/operator/nn/lrn.o build/src/operator/nn/dropout.o build/src/io/io.o build/src/io/image_aug_default.o build/src/io/iter_image_det_recordio.o build/src/io/image_io.o build/src/io/image_det_aug_default.o build/src/io/iter_csv.o build/src/io/iter_image_recordio.o build/src/io/iter_mnist.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/common/utils.o build/src/common/rtc.o build/src/nnvm/legacy_op_util.o build/src/nnvm/tvm_bridge.o build/src/nnvm/graph_editor.o build/src/nnvm/legacy_json_util.o build/src/profiler/profiler.o build/src/profiler/aggregate_stats.o build/src/profiler/vtune.o build/src/imperative/cached_op.o build/src/imperative/imperative_utils.o build/src/imperative/imperative.o build/src/ndarray/ndarray_function.o build/src/ndarray/ndarray.o build/src/operator/instance_norm.o build/src/operator/subgraph_op_common.o 
build/src/operator/grid_generator.o build/src/operator/pooling_v1.o build/src/operator/l2_normalization.o build/src/operator/rnn.o build/src/operator/make_loss.o build/src/operator/crop.o build/src/operator/spatial_transformer.o build/src/operator/operator.o build/src/operator/control_flow.o build/src/operator/swapaxis.o build/src/operator/convolution_v1.o build/src/operator/softmax_output.o build/src/operator/operator_util.o build/src/operator/roi_pooling.o build/src/operator/slice_channel.o build/src/operator/batch_norm_v1.o build/src/operator/loss_binary_op.o build/src/operator/regression_output.o build/src/operator/sequence_reverse.o build/src/operator/c_lapack_api.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/bilinear_sampler.o build/src/operator/svm_output.o build/src/operator/optimizer_op.o build/src/operator/sequence_last.o build/src/operator/cross_device_copy.o build/src/operator/correlation.o build/src/operator/pad.o build/src/operator/leaky_relu.o build/src/operator/operator_tune.o build/src/operator/sequence_mask.o build/src/engine/naive_engine.o build/src/engine/openmp.o build/src/engine/threaded_engine_pooled.o build/src/engine/threaded_engine.o build/src/engine/engine.o build/src/engine/threaded_engine_perdevice.o build/src/storage/storage.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_api_profile.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_test.o build/src/c_api/c_predict_api.o build/src/c_api/c_api_function.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/executor/onnx_to_tensorrt.o build/src/executor/inplace_addto_detect_pass.o build/src/executor/graph_executor.o build/src/executor/trt_graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/tensorrt_pass.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/kvstore/gradient_compression.o build/src/kvstore/kvstore_utils.o 
build/src/kvstore/kvstore.o build/src/resource.o build/src/libinfo.o build/src/initialize.o build/src/operator/nn/cudnn/cudnn_batch_norm_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/elemwise_unary_op_trig_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/diag_op_gpu.o build/src/operator/tensor/square_sum_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/histogram_gpu.o build/src/operator/tensor/dot_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o build/src/operator/tensor/ravel_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/elemwise_scatter_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_unary_op_basic_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/operator/contrib/optimizer_op_gpu.o build/src/operator/contrib/boolean_mask_gpu.o build/src/operator/contrib/adaptive_avg_pooling_gpu.o build/src/operator/contrib/ifft_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/index_copy_gpu.o build/src/operator/contrib/tensorrt_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o 
build/src/operator/contrib/bilinear_resize_gpu.o build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/dgl_graph_gpu.o build/src/operator/contrib/gradient_multiplier_op_gpu.o build/src/operator/contrib/bounding_box_gpu.o build/src/operator/contrib/fft_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/quadratic_op_gpu.o build/src/operator/contrib/transformer_gpu.o build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/adamw_gpu.o build/src/operator/contrib/sync_batch_norm_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/roi_align_gpu.o build/src/operator/random/shuffle_op_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o build/src/operator/random/multisample_op_gpu.o build/src/operator/random/sample_op_gpu.o build/src/operator/quantization/requantize_gpu.o build/src/operator/quantization/quantize_gpu.o build/src/operator/quantization/dequantize_gpu.o build/src/operator/quantization/quantized_conv_gpu.o build/src/operator/quantization/quantized_flatten_gpu.o build/src/operator/quantization/quantized_fully_connected_gpu.o build/src/operator/quantization/quantized_pooling_gpu.o build/src/operator/quantization/quantize_v2_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/image/resize_gpu.o build/src/operator/image/image_random_gpu.o build/src/operator/nn/lrn_gpu.o build/src/operator/nn/dropout_gpu.o build/src/operator/nn/softmax_activation_gpu.o build/src/operator/nn/fully_connected_gpu.o build/src/operator/nn/deconvolution_gpu.o build/src/operator/nn/pooling_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/nn/activation_gpu.o build/src/operator/nn/ctc_loss_gpu.o build/src/operator/nn/convolution_gpu.o build/src/operator/nn/upsampling_gpu.o build/src/operator/nn/batch_norm_gpu.o build/src/operator/nn/layer_norm_gpu.o 
build/src/operator/nn/concat_gpu.o build/src/common/utils_gpu.o build/src/common/random_generator_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/correlation_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/rnn_gpu.o build/src/operator/crop_gpu.o build/src/operator/convolution_v1_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/pad_gpu.o build/src/operator/bilinear_sampler_gpu.o build/src/operator/roi_pooling_gpu.o build/src/operator/batch_norm_v1_gpu.o build/src/operator/loss_binary_op_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/softmax_output_gpu.o build/src/kvstore/gradient_compression_gpu.o build/src/kvstore/kvstore_utils_gpu.o
- g++ -DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0 -shared -o lib/libmxnet.so build/src/operator/quantization/mkldnn/mkldnn_quantized_conv.o build/src/operator/quantization/mkldnn/mkldnn_quantized_pooling.o build/src/operator/quantization/mkldnn/mkldnn_quantized_concat.o build/src/operator/subgraph/mkldnn/mkldnn_conv_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv_post_quantize_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv.o build/src/operator/nn/mkldnn/mkldnn_convolution.o build/src/operator/nn/mkldnn/mkldnn_concat.o build/src/operator/nn/mkldnn/mkldnn_base.o build/src/operator/nn/mkldnn/mkldnn_slice.o build/src/operator/nn/mkldnn/mkldnn_act.o build/src/operator/nn/mkldnn/mkldnn_softmax.o build/src/operator/nn/mkldnn/mkldnn_deconvolution.o build/src/operator/nn/mkldnn/mkldnn_copy.o build/src/operator/nn/mkldnn/mkldnn_softmax_output.o build/src/operator/nn/mkldnn/mkldnn_fully_connected.o build/src/operator/nn/mkldnn/mkldnn_pooling.o build/src/operator/nn/mkldnn/mkldnn_sum.o build/src/operator/nn/cudnn/cudnn_algoreg.o 
build/src/operator/nn/cudnn/cudnn_batch_norm.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/square_sum.o build/src/operator/tensor/matrix_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/la_op.o build/src/operator/tensor/histogram.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/dot.o build/src/operator/tensor/elemwise_scatter_op.o build/src/operator/tensor/elemwise_unary_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/ravel.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o build/src/operator/tensor/diag_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/elemwise_binary_op.o build/src/operator/tensor/elemwise_unary_op_trig.o build/src/operator/contrib/tensorrt.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/sync_batch_norm.o build/src/operator/contrib/count_sketch.o build/src/operator/contrib/roi_align.o build/src/operator/contrib/bilinear_resize.o build/src/operator/contrib/nnz.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/nnvm_to_onnx.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dgl_graph.o build/src/operator/contrib/fft.o build/src/operator/contrib/multibox_prior.o 
build/src/operator/contrib/gradient_multiplier_op.o build/src/operator/contrib/adamw.o build/src/operator/contrib/transformer.o build/src/operator/contrib/krprod.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/index_copy.o build/src/operator/contrib/optimizer_op.o build/src/operator/contrib/bounding_box.o build/src/operator/contrib/proposal.o build/src/operator/contrib/boolean_mask.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quadratic_op.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/ifft.o build/src/operator/contrib/adaptive_avg_pooling.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/multisample_op.o build/src/operator/random/unique_sample_op.o build/src/operator/random/sample_op.o build/src/operator/random/shuffle_op.o build/src/operator/quantization/requantize.o build/src/operator/quantization/dequantize.o build/src/operator/quantization/quantize_graph_pass.o build/src/operator/quantization/quantized_flatten.o build/src/operator/quantization/quantized_conv.o build/src/operator/quantization/quantized_fully_connected.o build/src/operator/quantization/quantized_pooling.o build/src/operator/quantization/quantize_v2.o build/src/operator/quantization/quantized_concat.o build/src/operator/quantization/quantize.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/custom/custom.o build/src/operator/subgraph/partition_graph.o build/src/operator/subgraph/default_subgraph_property.o build/src/operator/nnpack/nnpack_util.o build/src/operator/image/image_random.o build/src/operator/image/resize.o build/src/operator/nn/softmax.o build/src/operator/nn/pooling.o build/src/operator/nn/deconvolution.o build/src/operator/nn/activation.o build/src/operator/nn/upsampling.o build/src/operator/nn/batch_norm.o build/src/operator/nn/ctc_loss.o build/src/operator/nn/fully_connected.o build/src/operator/nn/convolution.o 
build/src/operator/nn/layer_norm.o build/src/operator/nn/concat.o build/src/operator/nn/softmax_activation.o build/src/operator/nn/lrn.o build/src/operator/nn/dropout.o build/src/io/io.o build/src/io/image_aug_default.o build/src/io/iter_image_det_recordio.o build/src/io/image_io.o build/src/io/image_det_aug_default.o build/src/io/iter_csv.o build/src/io/iter_image_recordio.o build/src/io/iter_mnist.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/common/utils.o build/src/common/rtc.o build/src/nnvm/legacy_op_util.o build/src/nnvm/tvm_bridge.o build/src/nnvm/graph_editor.o build/src/nnvm/legacy_json_util.o build/src/profiler/profiler.o build/src/profiler/aggregate_stats.o build/src/profiler/vtune.o build/src/imperative/cached_op.o build/src/imperative/imperative_utils.o build/src/imperative/imperative.o build/src/ndarray/ndarray_function.o build/src/ndarray/ndarray.o build/src/operator/instance_norm.o build/src/operator/subgraph_op_common.o build/src/operator/grid_generator.o build/src/operator/pooling_v1.o build/src/operator/l2_normalization.o build/src/operator/rnn.o build/src/operator/make_loss.o build/src/operator/crop.o build/src/operator/spatial_transformer.o build/src/operator/operator.o build/src/operator/control_flow.o build/src/operator/swapaxis.o build/src/operator/convolution_v1.o build/src/operator/softmax_output.o build/src/operator/operator_util.o build/src/operator/roi_pooling.o build/src/operator/slice_channel.o build/src/operator/batch_norm_v1.o build/src/operator/loss_binary_op.o build/src/operator/regression_output.o build/src/operator/sequence_reverse.o build/src/operator/c_lapack_api.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/bilinear_sampler.o build/src/operator/svm_output.o build/src/operator/optimizer_op.o build/src/operator/sequence_last.o build/src/operator/cross_device_copy.o build/src/operator/correlation.o build/src/operator/pad.o build/src/operator/leaky_relu.o 
build/src/operator/operator_tune.o build/src/operator/sequence_mask.o build/src/engine/naive_engine.o build/src/engine/openmp.o build/src/engine/threaded_engine_pooled.o build/src/engine/threaded_engine.o build/src/engine/engine.o build/src/engine/threaded_engine_perdevice.o build/src/storage/storage.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_api_profile.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_test.o build/src/c_api/c_predict_api.o build/src/c_api/c_api_function.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/executor/onnx_to_tensorrt.o build/src/executor/inplace_addto_detect_pass.o build/src/executor/graph_executor.o build/src/executor/trt_graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/tensorrt_pass.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/kvstore/gradient_compression.o build/src/kvstore/kvstore_utils.o build/src/kvstore/kvstore.o build/src/resource.o build/src/libinfo.o build/src/initialize.o /home/mahmood/mx/mxnet/3rdparty/dmlc-core/libdmlc.a build/src/operator/nn/cudnn/cudnn_batch_norm_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/elemwise_unary_op_trig_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/diag_op_gpu.o build/src/operator/tensor/square_sum_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/histogram_gpu.o build/src/operator/tensor/dot_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o 
build/src/operator/tensor/ravel_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/elemwise_scatter_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_unary_op_basic_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/operator/contrib/optimizer_op_gpu.o build/src/operator/contrib/boolean_mask_gpu.o build/src/operator/contrib/adaptive_avg_pooling_gpu.o build/src/operator/contrib/ifft_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/index_copy_gpu.o build/src/operator/contrib/tensorrt_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o build/src/operator/contrib/bilinear_resize_gpu.o build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/dgl_graph_gpu.o build/src/operator/contrib/gradient_multiplier_op_gpu.o build/src/operator/contrib/bounding_box_gpu.o build/src/operator/contrib/fft_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/quadratic_op_gpu.o build/src/operator/contrib/transformer_gpu.o build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/adamw_gpu.o build/src/operator/contrib/sync_batch_norm_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/roi_align_gpu.o build/src/operator/random/shuffle_op_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o build/src/operator/random/multisample_op_gpu.o build/src/operator/random/sample_op_gpu.o 
build/src/operator/quantization/requantize_gpu.o build/src/operator/quantization/quantize_gpu.o build/src/operator/quantization/dequantize_gpu.o build/src/operator/quantization/quantized_conv_gpu.o build/src/operator/quantization/quantized_flatten_gpu.o build/src/operator/quantization/quantized_fully_connected_gpu.o build/src/operator/quantization/quantized_pooling_gpu.o build/src/operator/quantization/quantize_v2_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/image/resize_gpu.o build/src/operator/image/image_random_gpu.o build/src/operator/nn/lrn_gpu.o build/src/operator/nn/dropout_gpu.o build/src/operator/nn/softmax_activation_gpu.o build/src/operator/nn/fully_connected_gpu.o build/src/operator/nn/deconvolution_gpu.o build/src/operator/nn/pooling_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/nn/activation_gpu.o build/src/operator/nn/ctc_loss_gpu.o build/src/operator/nn/convolution_gpu.o build/src/operator/nn/upsampling_gpu.o build/src/operator/nn/batch_norm_gpu.o build/src/operator/nn/layer_norm_gpu.o build/src/operator/nn/concat_gpu.o build/src/common/utils_gpu.o build/src/common/random_generator_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/correlation_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/rnn_gpu.o build/src/operator/crop_gpu.o build/src/operator/convolution_v1_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/pad_gpu.o build/src/operator/bilinear_sampler_gpu.o build/src/operator/roi_pooling_gpu.o build/src/operator/batch_norm_v1_gpu.o 
build/src/operator/loss_binary_op_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/softmax_output_gpu.o build/src/kvstore/gradient_compression_gpu.o build/src/kvstore/kvstore_utils_gpu.o -pthread -lm -lcudart -lcublas -lcurand -lcusolver -L/usr/local/cuda/lib64 -L/usr/local/cuda/lib -Wl,--as-needed -lmklml_intel -lmklml_gnu -liomp5 -L/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/lib/ -lopenblas -fopenmp -lrt -L/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/lib -lmkldnn -Wl,-rpath,'${ORIGIN}' -lopencv_shape -lopencv_stitching -lopencv_superres -lopencv_videostab -lopencv_aruco -lopencv_bgsegm -lopencv_bioinspired -lopencv_ccalib -lopencv_datasets -lopencv_dpm -lopencv_face -lopencv_freetype -lopencv_fuzzy -lopencv_hdf -lopencv_line_descriptor -lopencv_optflow -lopencv_video -lopencv_plot -lopencv_reg -lopencv_saliency -lopencv_stereo -lopencv_structured_light -lopencv_phase_unwrapping -lopencv_rgbd -lopencv_viz -lopencv_surface_matching -lopencv_text -lopencv_ximgproc -lopencv_calib3d -lopencv_features2d -lopencv_flann -lopencv_xobjdetect -lopencv_objdetect -lopencv_ml -lopencv_xphoto -lopencv_highgui -lopencv_videoio -lopencv_imgcodecs -lopencv_photo -lopencv_imgproc -lopencv_core -lcudnn -lcufft -lcuda -lnvrtc -L/usr/local/cuda/lib64/stubs \
- -Wl,--whole-archive /home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/lib/libnnvm.a -Wl,--no-whole-archive
- a - build/src/operator/quantization/mkldnn/mkldnn_quantized_conv.o
- a - build/src/operator/quantization/mkldnn/mkldnn_quantized_pooling.o
- a - build/src/operator/quantization/mkldnn/mkldnn_quantized_concat.o
- a - build/src/operator/subgraph/mkldnn/mkldnn_conv_property.o
- a - build/src/operator/subgraph/mkldnn/mkldnn_conv_post_quantize_property.o
- a - build/src/operator/subgraph/mkldnn/mkldnn_conv.o
- a - build/src/operator/nn/mkldnn/mkldnn_convolution.o
- a - build/src/operator/nn/mkldnn/mkldnn_concat.o
- a - build/src/operator/nn/mkldnn/mkldnn_base.o
- a - build/src/operator/nn/mkldnn/mkldnn_slice.o
- a - build/src/operator/nn/mkldnn/mkldnn_act.o
- a - build/src/operator/nn/mkldnn/mkldnn_softmax.o
- a - build/src/operator/nn/mkldnn/mkldnn_deconvolution.o
- a - build/src/operator/nn/mkldnn/mkldnn_copy.o
- a - build/src/operator/nn/mkldnn/mkldnn_softmax_output.o
- a - build/src/operator/nn/mkldnn/mkldnn_fully_connected.o
- a - build/src/operator/nn/mkldnn/mkldnn_pooling.o
- a - build/src/operator/nn/mkldnn/mkldnn_sum.o
- a - build/src/operator/nn/cudnn/cudnn_algoreg.o
- a - build/src/operator/nn/cudnn/cudnn_batch_norm.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o
- a - build/src/operator/tensor/elemwise_binary_op_logic.o
- a - build/src/operator/tensor/square_sum.o
- a - build/src/operator/tensor/matrix_op.o
- a - build/src/operator/tensor/init_op.o
- a - build/src/operator/tensor/elemwise_sum.o
- a - build/src/operator/tensor/la_op.o
- a - build/src/operator/tensor/histogram.o
- a - build/src/operator/tensor/broadcast_reduce_op_index.o
- a - build/src/operator/tensor/dot.o
- a - build/src/operator/tensor/elemwise_scatter_op.o
- a - build/src/operator/tensor/elemwise_unary_op_basic.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o
- a - build/src/operator/tensor/ravel.o
- a - build/src/operator/tensor/broadcast_reduce_op_value.o
- a - build/src/operator/tensor/control_flow_op.o
- a - build/src/operator/tensor/elemwise_binary_op_basic.o
- a - build/src/operator/tensor/elemwise_binary_op_extended.o
- a - build/src/operator/tensor/indexing_op.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o
- a - build/src/operator/tensor/diag_op.o
- a - build/src/operator/tensor/ordering_op.o
- a - build/src/operator/tensor/sparse_retain.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_extended.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_basic.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_logic.o
- a - build/src/operator/tensor/cast_storage.o
- a - build/src/operator/tensor/elemwise_binary_op.o
- a - build/src/operator/tensor/elemwise_unary_op_trig.o
- a - build/src/operator/contrib/tensorrt.o
- a - build/src/operator/contrib/multibox_target.o
- a - build/src/operator/contrib/sync_batch_norm.o
- a - build/src/operator/contrib/count_sketch.o
- a - build/src/operator/contrib/roi_align.o
- a - build/src/operator/contrib/bilinear_resize.o
- a - build/src/operator/contrib/nnz.o
- a - build/src/operator/contrib/multibox_detection.o
- g++ -DMSHADOW_FORCE_STREAM -Wall -Wsign-compare -O3 -DNDEBUG=1 -I/home/mahmood/mx/mxnet/3rdparty/mshadow/ -I/home/mahmood/mx/mxnet/3rdparty/dmlc-core/include -fPIC -I/home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/include -I/home/mahmood/mx/mxnet/3rdparty/dlpack/include -I/home/mahmood/mx/mxnet/3rdparty/tvm/include -Iinclude -funroll-loops -Wno-unused-parameter -Wno-unknown-pragmas -Wno-unused-local-typedefs -msse3 -mf16c -I/usr/local/cuda/include -DMSHADOW_USE_CBLAS=1 -DMSHADOW_USE_MKL=0 -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMSHADOW_RABIT_PS=0 -DMSHADOW_DIST_PS=0 -DMSHADOW_USE_PASCAL=0 -DMXNET_USE_MKLDNN=1 -DUSE_MKL=1 -I/home/mahmood/mx/mxnet/src/operator/nn/mkldnn/ -I/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/include -DMXNET_USE_OPENCV=1 -I/usr/include/opencv -fopenmp -DMXNET_USE_OPERATOR_TUNING=1 -DMSHADOW_USE_CUDNN=1 -I/home/mahmood/mx/mxnet/3rdparty/cub -DMXNET_ENABLE_CUDA_RTC=1 -DMXNET_USE_NCCL=0 -DMXNET_USE_LIBJPEG_TURBO=0 -std=c++11 -o bin/im2rec tools/im2rec.cc build/src/operator/quantization/mkldnn/mkldnn_quantized_conv.o build/src/operator/quantization/mkldnn/mkldnn_quantized_pooling.o build/src/operator/quantization/mkldnn/mkldnn_quantized_concat.o build/src/operator/subgraph/mkldnn/mkldnn_conv_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv_post_quantize_property.o build/src/operator/subgraph/mkldnn/mkldnn_conv.o build/src/operator/nn/mkldnn/mkldnn_convolution.o build/src/operator/nn/mkldnn/mkldnn_concat.o build/src/operator/nn/mkldnn/mkldnn_base.o build/src/operator/nn/mkldnn/mkldnn_slice.o build/src/operator/nn/mkldnn/mkldnn_act.o build/src/operator/nn/mkldnn/mkldnn_softmax.o build/src/operator/nn/mkldnn/mkldnn_deconvolution.o build/src/operator/nn/mkldnn/mkldnn_copy.o build/src/operator/nn/mkldnn/mkldnn_softmax_output.o build/src/operator/nn/mkldnn/mkldnn_fully_connected.o build/src/operator/nn/mkldnn/mkldnn_pooling.o build/src/operator/nn/mkldnn/mkldnn_sum.o build/src/operator/nn/cudnn/cudnn_algoreg.o 
build/src/operator/nn/cudnn/cudnn_batch_norm.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic.o build/src/operator/tensor/elemwise_binary_op_logic.o build/src/operator/tensor/square_sum.o build/src/operator/tensor/matrix_op.o build/src/operator/tensor/init_op.o build/src/operator/tensor/elemwise_sum.o build/src/operator/tensor/la_op.o build/src/operator/tensor/histogram.o build/src/operator/tensor/broadcast_reduce_op_index.o build/src/operator/tensor/dot.o build/src/operator/tensor/elemwise_scatter_op.o build/src/operator/tensor/elemwise_unary_op_basic.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended.o build/src/operator/tensor/ravel.o build/src/operator/tensor/broadcast_reduce_op_value.o build/src/operator/tensor/control_flow_op.o build/src/operator/tensor/elemwise_binary_op_basic.o build/src/operator/tensor/elemwise_binary_op_extended.o build/src/operator/tensor/indexing_op.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic.o build/src/operator/tensor/diag_op.o build/src/operator/tensor/ordering_op.o build/src/operator/tensor/sparse_retain.o build/src/operator/tensor/elemwise_binary_scalar_op_extended.o build/src/operator/tensor/elemwise_binary_scalar_op_basic.o build/src/operator/tensor/elemwise_binary_scalar_op_logic.o build/src/operator/tensor/cast_storage.o build/src/operator/tensor/elemwise_binary_op.o build/src/operator/tensor/elemwise_unary_op_trig.o build/src/operator/contrib/tensorrt.o build/src/operator/contrib/multibox_target.o build/src/operator/contrib/sync_batch_norm.o build/src/operator/contrib/count_sketch.o build/src/operator/contrib/roi_align.o build/src/operator/contrib/bilinear_resize.o build/src/operator/contrib/nnz.o build/src/operator/contrib/multibox_detection.o build/src/operator/contrib/nnvm_to_onnx.o build/src/operator/contrib/deformable_psroi_pooling.o build/src/operator/contrib/dgl_graph.o build/src/operator/contrib/fft.o build/src/operator/contrib/multibox_prior.o 
build/src/operator/contrib/gradient_multiplier_op.o build/src/operator/contrib/adamw.o build/src/operator/contrib/transformer.o build/src/operator/contrib/krprod.o build/src/operator/contrib/multi_proposal.o build/src/operator/contrib/index_copy.o build/src/operator/contrib/optimizer_op.o build/src/operator/contrib/bounding_box.o build/src/operator/contrib/proposal.o build/src/operator/contrib/boolean_mask.o build/src/operator/contrib/psroi_pooling.o build/src/operator/contrib/quadratic_op.o build/src/operator/contrib/deformable_convolution.o build/src/operator/contrib/ifft.o build/src/operator/contrib/adaptive_avg_pooling.o build/src/operator/random/sample_multinomial_op.o build/src/operator/random/multisample_op.o build/src/operator/random/unique_sample_op.o build/src/operator/random/sample_op.o build/src/operator/random/shuffle_op.o build/src/operator/quantization/requantize.o build/src/operator/quantization/dequantize.o build/src/operator/quantization/quantize_graph_pass.o build/src/operator/quantization/quantized_flatten.o build/src/operator/quantization/quantized_conv.o build/src/operator/quantization/quantized_fully_connected.o build/src/operator/quantization/quantized_pooling.o build/src/operator/quantization/quantize_v2.o build/src/operator/quantization/quantized_concat.o build/src/operator/quantization/quantize.o build/src/operator/custom/native_op.o build/src/operator/custom/ndarray_op.o build/src/operator/custom/custom.o build/src/operator/subgraph/partition_graph.o build/src/operator/subgraph/default_subgraph_property.o build/src/operator/nnpack/nnpack_util.o build/src/operator/image/image_random.o build/src/operator/image/resize.o build/src/operator/nn/softmax.o build/src/operator/nn/pooling.o build/src/operator/nn/deconvolution.o build/src/operator/nn/activation.o build/src/operator/nn/upsampling.o build/src/operator/nn/batch_norm.o build/src/operator/nn/ctc_loss.o build/src/operator/nn/fully_connected.o build/src/operator/nn/convolution.o 
build/src/operator/nn/layer_norm.o build/src/operator/nn/concat.o build/src/operator/nn/softmax_activation.o build/src/operator/nn/lrn.o build/src/operator/nn/dropout.o build/src/io/io.o build/src/io/image_aug_default.o build/src/io/iter_image_det_recordio.o build/src/io/image_io.o build/src/io/image_det_aug_default.o build/src/io/iter_csv.o build/src/io/iter_image_recordio.o build/src/io/iter_mnist.o build/src/io/iter_image_recordio_2.o build/src/io/iter_libsvm.o build/src/common/utils.o build/src/common/rtc.o build/src/nnvm/legacy_op_util.o build/src/nnvm/tvm_bridge.o build/src/nnvm/graph_editor.o build/src/nnvm/legacy_json_util.o build/src/profiler/profiler.o build/src/profiler/aggregate_stats.o build/src/profiler/vtune.o build/src/imperative/cached_op.o build/src/imperative/imperative_utils.o build/src/imperative/imperative.o build/src/ndarray/ndarray_function.o build/src/ndarray/ndarray.o build/src/operator/instance_norm.o build/src/operator/subgraph_op_common.o build/src/operator/grid_generator.o build/src/operator/pooling_v1.o build/src/operator/l2_normalization.o build/src/operator/rnn.o build/src/operator/make_loss.o build/src/operator/crop.o build/src/operator/spatial_transformer.o build/src/operator/operator.o build/src/operator/control_flow.o build/src/operator/swapaxis.o build/src/operator/convolution_v1.o build/src/operator/softmax_output.o build/src/operator/operator_util.o build/src/operator/roi_pooling.o build/src/operator/slice_channel.o build/src/operator/batch_norm_v1.o build/src/operator/loss_binary_op.o build/src/operator/regression_output.o build/src/operator/sequence_reverse.o build/src/operator/c_lapack_api.o build/src/operator/identity_attach_KL_sparse_reg.o build/src/operator/bilinear_sampler.o build/src/operator/svm_output.o build/src/operator/optimizer_op.o build/src/operator/sequence_last.o build/src/operator/cross_device_copy.o build/src/operator/correlation.o build/src/operator/pad.o build/src/operator/leaky_relu.o 
build/src/operator/operator_tune.o build/src/operator/sequence_mask.o build/src/engine/naive_engine.o build/src/engine/openmp.o build/src/engine/threaded_engine_pooled.o build/src/engine/threaded_engine.o build/src/engine/engine.o build/src/engine/threaded_engine_perdevice.o build/src/storage/storage.o build/src/c_api/c_api_executor.o build/src/c_api/c_api_symbolic.o build/src/c_api/c_api_profile.o build/src/c_api/c_api_ndarray.o build/src/c_api/c_api_test.o build/src/c_api/c_predict_api.o build/src/c_api/c_api_function.o build/src/c_api/c_api.o build/src/c_api/c_api_error.o build/src/executor/onnx_to_tensorrt.o build/src/executor/inplace_addto_detect_pass.o build/src/executor/graph_executor.o build/src/executor/trt_graph_executor.o build/src/executor/infer_graph_attr_pass.o build/src/executor/tensorrt_pass.o build/src/executor/attach_op_execs_pass.o build/src/executor/attach_op_resource_pass.o build/src/kvstore/gradient_compression.o build/src/kvstore/kvstore_utils.o build/src/kvstore/kvstore.o build/src/resource.o build/src/libinfo.o build/src/initialize.o /home/mahmood/mx/mxnet/3rdparty/dmlc-core/libdmlc.a /home/mahmood/mx/mxnet/3rdparty/tvm/nnvm/lib/libnnvm.a build/src/operator/nn/cudnn/cudnn_batch_norm_gpu.o build/src/operator/tensor/elemwise_binary_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o build/src/operator/tensor/matrix_op_gpu.o build/src/operator/tensor/ordering_op_gpu.o build/src/operator/tensor/elemwise_unary_op_trig_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o build/src/operator/tensor/diag_op_gpu.o build/src/operator/tensor/square_sum_gpu.o build/src/operator/tensor/elemwise_binary_op_extended_gpu.o build/src/operator/tensor/elemwise_sum_gpu.o build/src/operator/tensor/init_op_gpu.o build/src/operator/tensor/cast_storage_gpu.o build/src/operator/tensor/histogram_gpu.o build/src/operator/tensor/dot_gpu.o 
build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o build/src/operator/tensor/ravel_gpu.o build/src/operator/tensor/control_flow_op_gpu.o build/src/operator/tensor/broadcast_reduce_op_value_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o build/src/operator/tensor/broadcast_reduce_op_index_gpu.o build/src/operator/tensor/elemwise_scatter_op_gpu.o build/src/operator/tensor/indexing_op_gpu.o build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o build/src/operator/tensor/la_op_gpu.o build/src/operator/tensor/elemwise_binary_op_logic_gpu.o build/src/operator/tensor/elemwise_unary_op_basic_gpu.o build/src/operator/tensor/sparse_retain_gpu.o build/src/operator/contrib/optimizer_op_gpu.o build/src/operator/contrib/boolean_mask_gpu.o build/src/operator/contrib/adaptive_avg_pooling_gpu.o build/src/operator/contrib/ifft_gpu.o build/src/operator/contrib/multibox_detection_gpu.o build/src/operator/contrib/index_copy_gpu.o build/src/operator/contrib/tensorrt_gpu.o build/src/operator/contrib/multibox_target_gpu.o build/src/operator/contrib/proposal_gpu.o build/src/operator/contrib/bilinear_resize_gpu.o build/src/operator/contrib/count_sketch_gpu.o build/src/operator/contrib/dgl_graph_gpu.o build/src/operator/contrib/gradient_multiplier_op_gpu.o build/src/operator/contrib/bounding_box_gpu.o build/src/operator/contrib/fft_gpu.o build/src/operator/contrib/multibox_prior_gpu.o build/src/operator/contrib/deformable_psroi_pooling_gpu.o build/src/operator/contrib/quadratic_op_gpu.o build/src/operator/contrib/transformer_gpu.o build/src/operator/contrib/multi_proposal_gpu.o build/src/operator/contrib/adamw_gpu.o build/src/operator/contrib/sync_batch_norm_gpu.o build/src/operator/contrib/psroi_pooling_gpu.o build/src/operator/contrib/deformable_convolution_gpu.o build/src/operator/contrib/roi_align_gpu.o build/src/operator/random/shuffle_op_gpu.o build/src/operator/random/sample_multinomial_op_gpu.o 
build/src/operator/random/multisample_op_gpu.o build/src/operator/random/sample_op_gpu.o build/src/operator/quantization/requantize_gpu.o build/src/operator/quantization/quantize_gpu.o build/src/operator/quantization/dequantize_gpu.o build/src/operator/quantization/quantized_conv_gpu.o build/src/operator/quantization/quantized_flatten_gpu.o build/src/operator/quantization/quantized_fully_connected_gpu.o build/src/operator/quantization/quantized_pooling_gpu.o build/src/operator/quantization/quantize_v2_gpu.o build/src/operator/custom/native_op_gpu.o build/src/operator/image/resize_gpu.o build/src/operator/image/image_random_gpu.o build/src/operator/nn/lrn_gpu.o build/src/operator/nn/dropout_gpu.o build/src/operator/nn/softmax_activation_gpu.o build/src/operator/nn/fully_connected_gpu.o build/src/operator/nn/deconvolution_gpu.o build/src/operator/nn/pooling_gpu.o build/src/operator/nn/softmax_gpu.o build/src/operator/nn/activation_gpu.o build/src/operator/nn/ctc_loss_gpu.o build/src/operator/nn/convolution_gpu.o build/src/operator/nn/upsampling_gpu.o build/src/operator/nn/batch_norm_gpu.o build/src/operator/nn/layer_norm_gpu.o build/src/operator/nn/concat_gpu.o build/src/common/utils_gpu.o build/src/common/random_generator_gpu.o build/src/ndarray/ndarray_function_gpu.o build/src/operator/svm_output_gpu.o build/src/operator/optimizer_op_gpu.o build/src/operator/spatial_transformer_gpu.o build/src/operator/make_loss_gpu.o build/src/operator/pooling_v1_gpu.o build/src/operator/instance_norm_gpu.o build/src/operator/sequence_mask_gpu.o build/src/operator/correlation_gpu.o build/src/operator/slice_channel_gpu.o build/src/operator/rnn_gpu.o build/src/operator/crop_gpu.o build/src/operator/convolution_v1_gpu.o build/src/operator/sequence_reverse_gpu.o build/src/operator/identity_attach_KL_sparse_reg_gpu.o build/src/operator/leaky_relu_gpu.o build/src/operator/swapaxis_gpu.o build/src/operator/grid_generator_gpu.o build/src/operator/pad_gpu.o 
build/src/operator/bilinear_sampler_gpu.o build/src/operator/roi_pooling_gpu.o build/src/operator/batch_norm_v1_gpu.o build/src/operator/loss_binary_op_gpu.o build/src/operator/regression_output_gpu.o build/src/operator/l2_normalization_gpu.o build/src/operator/sequence_last_gpu.o build/src/operator/softmax_output_gpu.o build/src/kvstore/gradient_compression_gpu.o build/src/kvstore/kvstore_utils_gpu.o -pthread -lm -lcudart -lcublas -lcurand -lcusolver -L/usr/local/cuda/lib64 -L/usr/local/cuda/lib -Wl,--as-needed -lmklml_intel -lmklml_gnu -liomp5 -L/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/lib/ -lopenblas -fopenmp -lrt -L/home/mahmood/mx/mxnet/3rdparty/mkldnn/build/install/lib -lmkldnn -Wl,-rpath,'${ORIGIN}' -lopencv_shape -lopencv_stitching -lopencv_superres -lopencv_videostab -lopencv_aruco -lopencv_bgsegm -lopencv_bioinspired -lopencv_ccalib -lopencv_datasets -lopencv_dpm -lopencv_face -lopencv_freetype -lopencv_fuzzy -lopencv_hdf -lopencv_line_descriptor -lopencv_optflow -lopencv_video -lopencv_plot -lopencv_reg -lopencv_saliency -lopencv_stereo -lopencv_structured_light -lopencv_phase_unwrapping -lopencv_rgbd -lopencv_viz -lopencv_surface_matching -lopencv_text -lopencv_ximgproc -lopencv_calib3d -lopencv_features2d -lopencv_flann -lopencv_xobjdetect -lopencv_objdetect -lopencv_ml -lopencv_xphoto -lopencv_highgui -lopencv_videoio -lopencv_imgcodecs -lopencv_photo -lopencv_imgproc -lopencv_core -lcudnn -lcufft -lcuda -lnvrtc -L/usr/local/cuda/lib64/stubs
- a - build/src/operator/contrib/nnvm_to_onnx.o
- a - build/src/operator/contrib/deformable_psroi_pooling.o
- a - build/src/operator/contrib/dgl_graph.o
- a - build/src/operator/contrib/fft.o
- a - build/src/operator/contrib/multibox_prior.o
- a - build/src/operator/contrib/gradient_multiplier_op.o
- a - build/src/operator/contrib/adamw.o
- a - build/src/operator/contrib/transformer.o
- a - build/src/operator/contrib/krprod.o
- a - build/src/operator/contrib/multi_proposal.o
- a - build/src/operator/contrib/index_copy.o
- a - build/src/operator/contrib/optimizer_op.o
- a - build/src/operator/contrib/bounding_box.o
- a - build/src/operator/contrib/proposal.o
- a - build/src/operator/contrib/boolean_mask.o
- a - build/src/operator/contrib/psroi_pooling.o
- a - build/src/operator/contrib/quadratic_op.o
- a - build/src/operator/contrib/deformable_convolution.o
- a - build/src/operator/contrib/ifft.o
- a - build/src/operator/contrib/adaptive_avg_pooling.o
- a - build/src/operator/random/sample_multinomial_op.o
- a - build/src/operator/random/multisample_op.o
- a - build/src/operator/random/unique_sample_op.o
- a - build/src/operator/random/sample_op.o
- a - build/src/operator/random/shuffle_op.o
- a - build/src/operator/quantization/requantize.o
- a - build/src/operator/quantization/dequantize.o
- a - build/src/operator/quantization/quantize_graph_pass.o
- a - build/src/operator/quantization/quantized_flatten.o
- a - build/src/operator/quantization/quantized_conv.o
- a - build/src/operator/quantization/quantized_fully_connected.o
- a - build/src/operator/quantization/quantized_pooling.o
- a - build/src/operator/quantization/quantize_v2.o
- a - build/src/operator/quantization/quantized_concat.o
- a - build/src/operator/quantization/quantize.o
- a - build/src/operator/custom/native_op.o
- a - build/src/operator/custom/ndarray_op.o
- a - build/src/operator/custom/custom.o
- a - build/src/operator/subgraph/partition_graph.o
- a - build/src/operator/subgraph/default_subgraph_property.o
- a - build/src/operator/nnpack/nnpack_util.o
- a - build/src/operator/image/image_random.o
- a - build/src/operator/image/resize.o
- a - build/src/operator/nn/softmax.o
- a - build/src/operator/nn/pooling.o
- a - build/src/operator/nn/deconvolution.o
- a - build/src/operator/nn/activation.o
- a - build/src/operator/nn/upsampling.o
- a - build/src/operator/nn/batch_norm.o
- a - build/src/operator/nn/ctc_loss.o
- a - build/src/operator/nn/fully_connected.o
- a - build/src/operator/nn/convolution.o
- a - build/src/operator/nn/layer_norm.o
- a - build/src/operator/nn/concat.o
- a - build/src/operator/nn/softmax_activation.o
- a - build/src/operator/nn/lrn.o
- a - build/src/operator/nn/dropout.o
- a - build/src/io/io.o
- a - build/src/io/image_aug_default.o
- a - build/src/io/iter_image_det_recordio.o
- a - build/src/io/image_io.o
- a - build/src/io/image_det_aug_default.o
- a - build/src/io/iter_csv.o
- a - build/src/io/iter_image_recordio.o
- a - build/src/io/iter_mnist.o
- a - build/src/io/iter_image_recordio_2.o
- a - build/src/io/iter_libsvm.o
- a - build/src/common/utils.o
- a - build/src/common/rtc.o
- a - build/src/nnvm/legacy_op_util.o
- a - build/src/nnvm/tvm_bridge.o
- a - build/src/nnvm/graph_editor.o
- a - build/src/nnvm/legacy_json_util.o
- a - build/src/profiler/profiler.o
- a - build/src/profiler/aggregate_stats.o
- a - build/src/profiler/vtune.o
- a - build/src/imperative/cached_op.o
- a - build/src/imperative/imperative_utils.o
- a - build/src/imperative/imperative.o
- a - build/src/ndarray/ndarray_function.o
- a - build/src/ndarray/ndarray.o
- a - build/src/operator/instance_norm.o
- a - build/src/operator/subgraph_op_common.o
- a - build/src/operator/grid_generator.o
- a - build/src/operator/pooling_v1.o
- a - build/src/operator/l2_normalization.o
- a - build/src/operator/rnn.o
- a - build/src/operator/make_loss.o
- a - build/src/operator/crop.o
- a - build/src/operator/spatial_transformer.o
- a - build/src/operator/operator.o
- a - build/src/operator/control_flow.o
- a - build/src/operator/swapaxis.o
- a - build/src/operator/convolution_v1.o
- a - build/src/operator/softmax_output.o
- a - build/src/operator/operator_util.o
- a - build/src/operator/roi_pooling.o
- a - build/src/operator/slice_channel.o
- a - build/src/operator/batch_norm_v1.o
- a - build/src/operator/loss_binary_op.o
- a - build/src/operator/regression_output.o
- a - build/src/operator/sequence_reverse.o
- a - build/src/operator/c_lapack_api.o
- a - build/src/operator/identity_attach_KL_sparse_reg.o
- a - build/src/operator/bilinear_sampler.o
- a - build/src/operator/svm_output.o
- a - build/src/operator/optimizer_op.o
- a - build/src/operator/sequence_last.o
- a - build/src/operator/cross_device_copy.o
- a - build/src/operator/correlation.o
- a - build/src/operator/pad.o
- a - build/src/operator/leaky_relu.o
- a - build/src/operator/operator_tune.o
- a - build/src/operator/sequence_mask.o
- a - build/src/engine/naive_engine.o
- a - build/src/engine/openmp.o
- a - build/src/engine/threaded_engine_pooled.o
- a - build/src/engine/threaded_engine.o
- a - build/src/engine/engine.o
- a - build/src/engine/threaded_engine_perdevice.o
- a - build/src/storage/storage.o
- a - build/src/c_api/c_api_executor.o
- a - build/src/c_api/c_api_symbolic.o
- a - build/src/c_api/c_api_profile.o
- a - build/src/c_api/c_api_ndarray.o
- a - build/src/c_api/c_api_test.o
- a - build/src/c_api/c_predict_api.o
- a - build/src/c_api/c_api_function.o
- a - build/src/c_api/c_api.o
- a - build/src/c_api/c_api_error.o
- a - build/src/executor/onnx_to_tensorrt.o
- a - build/src/executor/inplace_addto_detect_pass.o
- a - build/src/executor/graph_executor.o
- a - build/src/executor/trt_graph_executor.o
- a - build/src/executor/infer_graph_attr_pass.o
- a - build/src/executor/tensorrt_pass.o
- a - build/src/executor/attach_op_execs_pass.o
- a - build/src/executor/attach_op_resource_pass.o
- a - build/src/kvstore/gradient_compression.o
- a - build/src/kvstore/kvstore_utils.o
- a - build/src/kvstore/kvstore.o
- a - build/src/resource.o
- a - build/src/libinfo.o
- a - build/src/initialize.o
- a - build/src/operator/nn/cudnn/cudnn_batch_norm_gpu.o
- a - build/src/operator/tensor/elemwise_binary_op_basic_gpu.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_basic_gpu.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_extended_gpu.o
- a - build/src/operator/tensor/matrix_op_gpu.o
- a - build/src/operator/tensor/ordering_op_gpu.o
- a - build/src/operator/tensor/elemwise_unary_op_trig_gpu.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_extended_gpu.o
- a - build/src/operator/tensor/diag_op_gpu.o
- a - build/src/operator/tensor/square_sum_gpu.o
- a - build/src/operator/tensor/elemwise_binary_op_extended_gpu.o
- a - build/src/operator/tensor/elemwise_sum_gpu.o
- a - build/src/operator/tensor/init_op_gpu.o
- a - build/src/operator/tensor/cast_storage_gpu.o
- a - build/src/operator/tensor/histogram_gpu.o
- a - build/src/operator/tensor/dot_gpu.o
- a - build/src/operator/tensor/elemwise_binary_scalar_op_logic_gpu.o
- a - build/src/operator/tensor/ravel_gpu.o
- a - build/src/operator/tensor/control_flow_op_gpu.o
- a - build/src/operator/tensor/broadcast_reduce_op_value_gpu.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_basic_gpu.o
- a - build/src/operator/tensor/broadcast_reduce_op_index_gpu.o
- a - build/src/operator/tensor/elemwise_scatter_op_gpu.o
- a - build/src/operator/tensor/indexing_op_gpu.o
- a - build/src/operator/tensor/elemwise_binary_broadcast_op_logic_gpu.o
- a - build/src/operator/tensor/la_op_gpu.o
- a - build/src/operator/tensor/elemwise_binary_op_logic_gpu.o
- a - build/src/operator/tensor/elemwise_unary_op_basic_gpu.o
- a - build/src/operator/tensor/sparse_retain_gpu.o
- a - build/src/operator/contrib/optimizer_op_gpu.o
- a - build/src/operator/contrib/boolean_mask_gpu.o
- a - build/src/operator/contrib/adaptive_avg_pooling_gpu.o
- a - build/src/operator/contrib/ifft_gpu.o
- a - build/src/operator/contrib/multibox_detection_gpu.o
- a - build/src/operator/contrib/index_copy_gpu.o
- a - build/src/operator/contrib/tensorrt_gpu.o
- a - build/src/operator/contrib/multibox_target_gpu.o
- a - build/src/operator/contrib/proposal_gpu.o
- a - build/src/operator/contrib/bilinear_resize_gpu.o
- a - build/src/operator/contrib/count_sketch_gpu.o
- a - build/src/operator/contrib/dgl_graph_gpu.o
- a - build/src/operator/contrib/gradient_multiplier_op_gpu.o
- a - build/src/operator/contrib/bounding_box_gpu.o
- a - build/src/operator/contrib/fft_gpu.o
- a - build/src/operator/contrib/multibox_prior_gpu.o
- a - build/src/operator/contrib/deformable_psroi_pooling_gpu.o
- a - build/src/operator/contrib/quadratic_op_gpu.o
- a - build/src/operator/contrib/transformer_gpu.o
- a - build/src/operator/contrib/multi_proposal_gpu.o
- a - build/src/operator/contrib/adamw_gpu.o
- a - build/src/operator/contrib/sync_batch_norm_gpu.o
- a - build/src/operator/contrib/psroi_pooling_gpu.o
- a - build/src/operator/contrib/deformable_convolution_gpu.o
- a - build/src/operator/contrib/roi_align_gpu.o
- a - build/src/operator/random/shuffle_op_gpu.o
- a - build/src/operator/random/sample_multinomial_op_gpu.o
- a - build/src/operator/random/multisample_op_gpu.o
- a - build/src/operator/random/sample_op_gpu.o
- a - build/src/operator/quantization/requantize_gpu.o
- a - build/src/operator/quantization/quantize_gpu.o
- a - build/src/operator/quantization/dequantize_gpu.o
- a - build/src/operator/quantization/quantized_conv_gpu.o
- a - build/src/operator/quantization/quantized_flatten_gpu.o
- a - build/src/operator/quantization/quantized_fully_connected_gpu.o
- a - build/src/operator/quantization/quantized_pooling_gpu.o
- a - build/src/operator/quantization/quantize_v2_gpu.o
- a - build/src/operator/custom/native_op_gpu.o
- a - build/src/operator/image/resize_gpu.o
- a - build/src/operator/image/image_random_gpu.o
- a - build/src/operator/nn/lrn_gpu.o
- a - build/src/operator/nn/dropout_gpu.o
- a - build/src/operator/nn/softmax_activation_gpu.o
- a - build/src/operator/nn/fully_connected_gpu.o
- a - build/src/operator/nn/deconvolution_gpu.o
- a - build/src/operator/nn/pooling_gpu.o
- a - build/src/operator/nn/softmax_gpu.o
- a - build/src/operator/nn/activation_gpu.o
- a - build/src/operator/nn/ctc_loss_gpu.o
- a - build/src/operator/nn/convolution_gpu.o
- a - build/src/operator/nn/upsampling_gpu.o
- a - build/src/operator/nn/batch_norm_gpu.o
- a - build/src/operator/nn/layer_norm_gpu.o
- a - build/src/operator/nn/concat_gpu.o
- a - build/src/common/utils_gpu.o
- a - build/src/common/random_generator_gpu.o
- a - build/src/ndarray/ndarray_function_gpu.o
- a - build/src/operator/svm_output_gpu.o
- a - build/src/operator/optimizer_op_gpu.o
- a - build/src/operator/spatial_transformer_gpu.o
- a - build/src/operator/make_loss_gpu.o
- a - build/src/operator/pooling_v1_gpu.o
- a - build/src/operator/instance_norm_gpu.o
- a - build/src/operator/sequence_mask_gpu.o
- a - build/src/operator/correlation_gpu.o
- a - build/src/operator/slice_channel_gpu.o
- a - build/src/operator/rnn_gpu.o
- a - build/src/operator/crop_gpu.o
- a - build/src/operator/convolution_v1_gpu.o
- a - build/src/operator/sequence_reverse_gpu.o
- a - build/src/operator/identity_attach_KL_sparse_reg_gpu.o
- a - build/src/operator/leaky_relu_gpu.o
- a - build/src/operator/swapaxis_gpu.o
- a - build/src/operator/grid_generator_gpu.o
- a - build/src/operator/pad_gpu.o
- a - build/src/operator/bilinear_sampler_gpu.o
- a - build/src/operator/roi_pooling_gpu.o
- a - build/src/operator/batch_norm_v1_gpu.o
- a - build/src/operator/loss_binary_op_gpu.o
- a - build/src/operator/regression_output_gpu.o
- a - build/src/operator/l2_normalization_gpu.o
- a - build/src/operator/sequence_last_gpu.o
- a - build/src/operator/softmax_output_gpu.o
- a - build/src/kvstore/gradient_compression_gpu.o
- a - build/src/kvstore/kvstore_utils_gpu.o
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement