Created
January 5, 2017 11:42
-
-
Save agibsonccc/73d57fbe87ce6d201a2e5ca4312d9cdc to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
[agibsonccc@localhost libnd4j]$ ./buildnativeoperations.sh -c cuda | |
eval cmake | |
PACKAGING = none | |
BUILD = release | |
CHIP = cuda | |
ARCH = x86-64 | |
CHIP_VERSION = | |
GPU_COMPUTE_CAPABILITY = all | |
EXPERIMENTAL = no | |
LIBRARY TYPE = dynamic | |
/home/agibsonccc/code/libnd4j/blasbuild/cuda | |
-- The C compiler identification is GNU 5.3.1 | |
-- The CXX compiler identification is GNU 5.3.1 | |
-- Check for working C compiler: /bin/cc | |
-- Check for working C compiler: /bin/cc -- works | |
-- Detecting C compiler ABI info | |
-- Detecting C compiler ABI info - done | |
-- Detecting C compile features | |
-- Detecting C compile features - done | |
-- Check for working CXX compiler: /bin/c++ | |
-- Check for working CXX compiler: /bin/c++ -- works | |
-- Detecting CXX compiler ABI info | |
-- Detecting CXX compiler ABI info - done | |
-- Detecting CXX compile features | |
-- Detecting CXX compile features - done | |
-- Looking for pthread.h | |
-- Looking for pthread.h - found | |
-- Looking for pthread_create | |
-- Looking for pthread_create - not found | |
-- Looking for pthread_create in pthreads | |
-- Looking for pthread_create in pthreads - not found | |
-- Looking for pthread_create in pthread | |
-- Looking for pthread_create in pthread - found | |
-- Found Threads: TRUE | |
-- Found CUDA: /usr/local/cuda-8.0 (found version "8.0") | |
ADDING BLAS | |
Build cublas | |
CUDA found! | |
Compiling to external module | |
-- Configuring done | |
-- Generating done | |
CMake Warning: | |
Manually-specified variables were not used by the project: | |
MKL_MULTI_THREADED | |
-- Build files have been written to: /home/agibsonccc/code/libnd4j/blasbuild/cuda | |
/usr/bin/cmake -H/home/agibsonccc/code/libnd4j -B/home/agibsonccc/code/libnd4j/blasbuild/cuda --check-build-system CMakeFiles/Makefile.cmake 0 | |
/usr/bin/cmake -E cmake_progress_start /home/agibsonccc/code/libnd4j/blasbuild/cuda/CMakeFiles /home/agibsonccc/code/libnd4j/blasbuild/cuda/CMakeFiles/progress.marks | |
make -f CMakeFiles/Makefile2 all | |
make[1]: Entering directory '/home/agibsonccc/code/libnd4j/blasbuild/cuda' | |
make -f blas/CMakeFiles/nd4jcuda.dir/build.make blas/CMakeFiles/nd4jcuda.dir/depend | |
make[2]: Entering directory '/home/agibsonccc/code/libnd4j/blasbuild/cuda' | |
[ 50%] Building NVCC (Device) object blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o | |
cd /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda && /usr/bin/cmake -E make_directory /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/. | |
cd /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda && /usr/bin/cmake -D verbose:BOOL=ON -D build_configuration:STRING=Release -D generated_file:STRING=/home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o -D generated_cubin_file:STRING=/home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o.cubin.txt -P /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.cmake | |
-- Removing /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
/usr/bin/cmake -E remove /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
-- Generating dependency file: /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.NVCC-depend | |
/usr/local/cuda-8.0/bin/nvcc -M -D__CUDACC__ /home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu -o /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.NVCC-depend -m64 --std c++11 -D__CUDABLAS__=true -Dnd4jcuda_EXPORTS -Xcompiler ,\"-Wall\",\"-O3\",\"-Wl,-rpath,$ORIGIN/\",\"-march=x86-64\",\"-mtune=x86-64\",\"-fPIC\",\"-Wall\",\"-O3\",\"-fassociative-math\",\"-funsafe-math-optimizations\" --ptxas-options=-v -DCUDA_8 -DVERBOSE --cudart=static -O3 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_53,code=sm_53 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_62,code=sm_62 -DNVCC -I/usr/local/cuda-8.0/include -I/home/agibsonccc/code/libnd4j/include -I/usr/include -I/usr/local/include -I/usr/local/cuda-8.0/include | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
-- Generating temporary cmake readable file: /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp | |
/usr/bin/cmake -D input_file:FILEPATH=/home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.NVCC-depend -D output_file:FILEPATH=/home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp -P /home/agibsonccc/code/libnd4j/cmake/FindCUDA/make2cmake.cmake | |
-- Copy if different /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp to /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend | |
/usr/bin/cmake -E copy_if_different /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend | |
-- Removing /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp and /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.NVCC-depend | |
/usr/bin/cmake -E remove /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.depend.tmp /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o.NVCC-depend | |
-- Generating /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
/usr/local/cuda-8.0/bin/nvcc /home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu -c -o /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o -m64 --std c++11 -D__CUDABLAS__=true -Dnd4jcuda_EXPORTS -Xcompiler ,\"-Wall\",\"-O3\",\"-Wl,-rpath,$ORIGIN/\",\"-march=x86-64\",\"-mtune=x86-64\",\"-fPIC\",\"-Wall\",\"-O3\",\"-fassociative-math\",\"-funsafe-math-optimizations\" --ptxas-options=-v -DCUDA_8 -DVERBOSE --cudart=static -O3 -gencode arch=compute_30,code=sm_30 -gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_53,code=sm_53 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_62,code=sm_62 -DNVCC -I/usr/local/cuda-8.0/include -I/home/agibsonccc/code/libnd4j/include -I/usr/include -I/usr/local/include -I/usr/local/cuda-8.0/include | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu:1:0: warning: -mtune=x86-64 is deprecated; use -mtune=k8 or -mtune=generic instead as appropriate [-Wdeprecated] | |
^ | |
/home/agibsonccc/code/libnd4j/include/types/float16.h(50): warning: a __host__ function("cpu_half2float") redeclared with __host__ __device__, hence treated as a __host__ __device__ function | |
/home/agibsonccc/code/libnd4j/include/types/float16.h(88): warning: a __host__ function("cpu_float2half_rn") redeclared with __host__ __device__, hence treated as a __host__ __device__ function | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(125): warning: variable "ccMinor" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(193): warning: variable "regPerBlock" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(209): warning: variable "effective_block_limit" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(281): warning: variable "zRank" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(286): warning: variable "regPerBlock" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(301): warning: variable "memory_floor" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(609): warning: variable "hostYShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(610): warning: variable "hostZShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(1836): warning: variable "hostYShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(1837): warning: variable "hostZShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(2057): warning: variable "hostYShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(2058): warning: variable "hostZShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(2132): warning: variable "hostYShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/blas/cuda/NativeOps.cu(2133): warning: variable "hostZShapeInfo" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(329): warning: variable "tid" was declared but never referenced | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=double]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=double]" | |
(907): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(333): warning: variable "xElementWiseStride" was declared but never referenced | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=double]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=double]" | |
(907): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(334): warning: variable "yElementWiseStride" was declared but never referenced | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=double]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=double]" | |
(907): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(342): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::transform<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16, OpType=simdOps::ManhattanDistance<float16>]" | |
(504): here | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=float16]" | |
(979): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(342): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::transform<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16, OpType=simdOps::EuclideanDistance<float16>]" | |
(504): here | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=float16]" | |
(979): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(342): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::transform<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16, OpType=simdOps::CosineSimilarity<float16>]" | |
(504): here | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=float16]" | |
(979): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(342): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::transform<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16, OpType=simdOps::Dot<float16>]" | |
(504): here | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=float16]" | |
(979): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(342): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::transform<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16, OpType=simdOps::EqualsWithEps<float16>]" | |
(504): here | |
instantiation of "void functions::reduce3::Reduce3<T>::exec(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, UnifiedSharedMemory *, int *, int *, int *, int *) [with T=float16]" | |
(840): here | |
instantiation of "void reduce3Generic(int, T *, int *, T *, int *, T *, T *, int *, int *, int, int, int *, int *, int *, int *, int *) [with T=float16]" | |
(979): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(172): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16, OpType=simdOps::ManhattanDistance<float16>]" | |
(521): here | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16]" | |
(876): here | |
instantiation of "void reduce3ScalarGeneric(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, int *, int *, int *, int *) [with T=float16]" | |
(1032): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(172): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16, OpType=simdOps::EuclideanDistance<float16>]" | |
(521): here | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16]" | |
(876): here | |
instantiation of "void reduce3ScalarGeneric(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, int *, int *, int *, int *) [with T=float16]" | |
(1032): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(172): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16, OpType=simdOps::CosineSimilarity<float16>]" | |
(521): here | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16]" | |
(876): here | |
instantiation of "void reduce3ScalarGeneric(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, int *, int *, int *, int *) [with T=float16]" | |
(1032): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(172): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16, OpType=simdOps::Dot<float16>]" | |
(521): here | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16]" | |
(876): here | |
instantiation of "void reduce3ScalarGeneric(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, int *, int *, int *, int *) [with T=float16]" | |
(1032): here | |
/home/agibsonccc/code/libnd4j/include/loops/reduce3.h(172): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda<OpType>(T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16, OpType=simdOps::EqualsWithEps<float16>]" | |
(521): here | |
instantiation of "void functions::reduce3::Reduce3<T>::execScalarCuda(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *, int *) [with T=float16]" | |
(876): here | |
instantiation of "void reduce3ScalarGeneric(int, T *, int *, T *, int *, T *, T *, int *, int *, T *, int *, int *, int *, int *) [with T=float16]" | |
(1032): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexMax<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexMax<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexMin<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexMin<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexAbsoluteMax<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexAbsoluteMax<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexAbsoluteMin<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double, OpType=simdOps::IndexAbsoluteMin<double>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=double]" | |
(720): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexMax<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexMax<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexMin<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexMin<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexAbsoluteMax<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexAbsoluteMax<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexAbsoluteMin<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float, OpType=simdOps::IndexAbsoluteMin<float>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float]" | |
(758): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexMax<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexMax<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexMin<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexMin<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexAbsoluteMax<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexAbsoluteMax<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(296): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexAbsoluteMin<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/loops/indexreduce.h(306): warning: invalid narrowing conversion from "int" to "unsigned int" | |
detected during: | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform<OpType>(T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16, OpType=simdOps::IndexAbsoluteMin<float16>]" | |
(98): here | |
instantiation of "void functions::indexreduce::IndexReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=float16]" | |
(692): here | |
instantiation of "void indexReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, int *, T *, int *, int *) [with T=float16]" | |
(781): here | |
/home/agibsonccc/code/libnd4j/include/ops/special_ops.h(824): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void simdOps::SoftMax<T>::execSpecialCuda(T *, int *, T *, int *, T *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(148): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda<OpType>(T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16, OpType=simdOps::SoftMax<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(245): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda(int, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(615): here | |
instantiation of "void transformGenericIndexes(int, T *, int *, int, T *, T *, int *, int *, T *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(684): here | |
/home/agibsonccc/code/libnd4j/include/ops/special_ops.h(1154): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void simdOps::SoftMaxDerivative<T>::execSpecialCuda(T *, int *, T *, int *, T *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(148): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda<OpType>(T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16, OpType=simdOps::SoftMaxDerivative<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(245): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda(int, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(615): here | |
instantiation of "void transformGenericIndexes(int, T *, int *, int, T *, T *, int *, int *, T *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(684): here | |
/home/agibsonccc/code/libnd4j/include/ops/special_ops.h(995): warning: __shared__ memory variable with non-empty constructor or destructor (potential race between threads) | |
detected during: | |
instantiation of "void simdOps::LogSoftMax<T>::execSpecialCuda(T *, int *, T *, int *, T *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(148): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda<OpType>(T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16, OpType=simdOps::LogSoftMax<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(245): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda(int, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(615): here | |
instantiation of "void transformGenericIndexes(int, T *, int *, int, T *, T *, int *, int *, T *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(684): here | |
/home/agibsonccc/code/libnd4j/include/helpers/../templatemath.h(137): error: more than one operator "<" matches these operands: | |
built-in operator "arithmetic < arithmetic" | |
function "operator<(const float16 &, const float16 &)" | |
operand types are: float16 < int | |
detected during: | |
instantiation of "T nd4j::math::nd4j_sgn(T) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/ops/ops.h(681): here | |
instantiation of "T simdOps::RationalTanh<T>::op(T, T *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(221): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda<OpType>(Nd4jIndex, T *, int, T *, T *, int, int *, T *, UnifiedSharedMemory *) [with T=float16, OpType=simdOps::RationalTanh<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(176): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda<OpType>(T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16, OpType=simdOps::RationalTanh<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(245): here | |
instantiation of "void functions::transform::Transform<T>::transformCuda(int, T *, int *, T *, T *, int *, int *, T *, UnifiedSharedMemory *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(615): here | |
instantiation of "void transformGenericIndexes(int, T *, int *, int, T *, T *, int *, int *, T *) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(684): here | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(1413): warning: variable "yStride" was declared but never referenced | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(1449): warning: variable "zX" was declared but never referenced | |
detected during instantiation of "void shuffleKernelGeneric(T **, int **, T **, int **, int, int *, int **, int **) [with T=double]" | |
(1482): here | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(1449): warning: variable "zX" was declared but never referenced | |
detected during instantiation of "void shuffleKernelGeneric(T **, int **, T **, int **, int, int *, int **, int **) [with T=float]" | |
(1486): here | |
/home/agibsonccc/code/libnd4j/include/loops/transform.h(1449): warning: variable "zX" was declared but never referenced | |
detected during instantiation of "void shuffleKernelGeneric(T **, int **, T **, int **, int, int *, int **, int **) [with T=float16]" | |
(1490): here | |
/home/agibsonccc/code/libnd4j/include/loops/summarystatsreduce.h(355): warning: variable "numElements" was declared but never referenced | |
detected during: | |
instantiation of "void functions::summarystats::SummaryStatsReduce<T>::transform(int, T *, int *, T *, T *, int *, int *, int, int, int *, T *, UnifiedSharedMemory *, int *, int *) [with T=double]" | |
(875): here | |
instantiation of "void summaryStatsReduceGeneric(int, T *, int *, int, T *, T *, int *, int, int *, int, int, __nv_bool, int *, T *, int *, int *) [with T=double]" | |
(903): here | |
/home/agibsonccc/code/libnd4j/include/ops/special_random_ops.h(34): warning: variable "xLength" was set but never used | |
detected during: | |
instantiation of "void functions::random::RandomFunction<T>::execTransformCuda<OpClass>(Nd4jPointer, T *, int *, T *, int *, T *, int *, T *) [with T=float, OpClass=randomOps::Choice<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/random.h(489): here | |
instantiation of "void randomTripleGeneric<T,OpClass>(Nd4jPointer, T *, int *, T *, int *, T *, int *, T *) [with T=float, OpClass=randomOps::Choice<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/random.h(502): here | |
/home/agibsonccc/code/libnd4j/include/ops/aggregate_ops.h(825): warning: variable "initialIdx" was set but never used | |
detected during: | |
instantiation of "void functions::aggregate::AggregatedFunction<T>::execCuda<OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float, OpClass=aggregateOps::CBOW<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(50): here | |
instantiation of "void aggregateGeneric<T,OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float, OpClass=aggregateOps::CBOW<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(100): here | |
/home/agibsonccc/code/libnd4j/include/ops/aggregate_ops.h(842): warning: variable "expTable" was declared but never referenced | |
detected during: | |
instantiation of "void aggregateOps::CBOW<T>::executeAggregateCuda(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(30): here | |
instantiation of "void functions::aggregate::AggregatedFunction<T>::execCuda<OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float, OpClass=aggregateOps::CBOW<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(50): here | |
instantiation of "void aggregateGeneric<T,OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float, OpClass=aggregateOps::CBOW<float>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(100): here | |
/home/agibsonccc/code/libnd4j/include/ops/aggregate_ops.h(842): warning: variable "expTable" was declared but never referenced | |
detected during: | |
instantiation of "void aggregateOps::CBOW<T>::executeAggregateCuda(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=double]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(30): here | |
instantiation of "void functions::aggregate::AggregatedFunction<T>::execCuda<OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=double, OpClass=aggregateOps::CBOW<double>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(50): here | |
instantiation of "void aggregateGeneric<T,OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=double, OpClass=aggregateOps::CBOW<double>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(101): here | |
/home/agibsonccc/code/libnd4j/include/ops/aggregate_ops.h(842): warning: variable "expTable" was declared but never referenced | |
detected during: | |
instantiation of "void aggregateOps::CBOW<T>::executeAggregateCuda(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float16]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(30): here | |
instantiation of "void functions::aggregate::AggregatedFunction<T>::execCuda<OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float16, OpClass=aggregateOps::CBOW<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(50): here | |
instantiation of "void aggregateGeneric<T,OpClass>(T **, int, int **, int, int *, int, int **, int, T *, int) [with T=float16, OpClass=aggregateOps::CBOW<float16>]" | |
/home/agibsonccc/code/libnd4j/include/loops/aggregates.h(102): here | |
1 error detected in the compilation of "/tmp/tmpxft_00006b61_00000000-23_NativeOps.compute_62.cpp1.ii". | |
-- Removing /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
/usr/bin/cmake -E remove /home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
CMake Error at nd4jcuda_generated_NativeOps.cu.o.cmake:257 (message): | |
Error generating file | |
/home/agibsonccc/code/libnd4j/blasbuild/cuda/blas/CMakeFiles/nd4jcuda.dir/cuda/./nd4jcuda_generated_NativeOps.cu.o | |
blas/CMakeFiles/nd4jcuda.dir/build.make:66: recipe for target 'blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o' failed | |
make[2]: *** [blas/CMakeFiles/nd4jcuda.dir/cuda/nd4jcuda_generated_NativeOps.cu.o] Error 1 | |
make[2]: Leaving directory '/home/agibsonccc/code/libnd4j/blasbuild/cuda' | |
CMakeFiles/Makefile2:124: recipe for target 'blas/CMakeFiles/nd4jcuda.dir/all' failed | |
make[1]: *** [blas/CMakeFiles/nd4jcuda.dir/all] Error 2 | |
make[1]: Leaving directory '/home/agibsonccc/code/libnd4j/blasbuild/cuda' | |
Makefile:86: recipe for target 'all' failed | |
make: *** [all] Error 2 |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment