ext/torch/extconf.rb in torch-rb-0.1.8 vs ext/torch/extconf.rb in torch-rb-0.2.0

- old
+ new

@@ -1,30 +1,57 @@ require "mkmf-rice" abort "Missing stdc++" unless have_library("stdc++") -$CXXFLAGS << " -std=c++11" +$CXXFLAGS << " -std=c++14" -# needed for Linux pre-cxx11 ABI version -# $CXXFLAGS << " -D_GLIBCXX_USE_CXX11_ABI=0" +# change to 0 for Linux pre-cxx11 ABI version +$CXXFLAGS << " -D_GLIBCXX_USE_CXX11_ABI=1" +# TODO check compiler name +clang = RbConfig::CONFIG["host_os"] =~ /darwin/i + +if have_library("omp") || have_library("gomp") + $CXXFLAGS << " -DAT_PARALLEL_OPENMP=1" + $CXXFLAGS << " -Xclang" if clang + $CXXFLAGS << " -fopenmp" +end + # silence ruby/intern.h warning $CXXFLAGS << " -Wno-deprecated-register" # silence torch warnings -$CXXFLAGS << " -Wno-shorten-64-to-32 -Wno-missing-noreturn" +if clang + $CXXFLAGS << " -Wno-shorten-64-to-32 -Wno-missing-noreturn" +else + $CXXFLAGS << " -Wno-duplicated-cond -Wno-suggest-attribute=noreturn" +end inc, lib = dir_config("torch") - inc ||= "/usr/local/include" lib ||= "/usr/local/lib" +cuda_inc, cuda_lib = dir_config("cuda") +cuda_inc ||= "/usr/local/cuda/include" +cuda_lib ||= "/usr/local/cuda/lib64" + +with_cuda = Dir["#{lib}/*torch_cuda*"].any? && have_library("cuda") && have_library("cudnn") + $INCFLAGS << " -I#{inc}" $INCFLAGS << " -I#{inc}/torch/csrc/api/include" $LDFLAGS << " -Wl,-rpath,#{lib}" +$LDFLAGS << ":#{cuda_lib}/stubs:#{cuda_lib}" if with_cuda $LDFLAGS << " -L#{lib}" -$LDFLAGS << " -ltorch -lc10" +$LDFLAGS << " -L#{cuda_lib}" if with_cuda + +# https://github.com/pytorch/pytorch/blob/v1.5.0/torch/utils/cpp_extension.py#L1232-L1238 +$LDFLAGS << " -lc10 -ltorch_cpu -ltorch" +if with_cuda + $LDFLAGS << " -lcuda -lnvrtc -lnvToolsExt -lcudart -lc10_cuda -ltorch_cuda -lcufft -lcurand -lcublas -lcudnn" + # TODO figure out why this is needed + $LDFLAGS << " -Wl,--no-as-needed,#{lib}/libtorch.so" +end # generate C++ functions puts "Generating C++ functions..." require_relative "../../lib/torch/native/generator" Torch::Native::Generator.generate_cpp_functions