Skip to content

Setting up PyTorch plugin "bias_act_plugin"... Failed! #15

@beeternity

Description

@beeternity

Traceback (most recent call last):
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1808, in _run_ninja_build
subprocess.run(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/subprocess.py", line 528, in run
raise CalledProcessError(retcode, process.args,
subprocess.CalledProcessError: Command '['ninja', '-v']' returned non-zero exit status 1.

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 320, in <module>
main() # pylint: disable=no-value-for-parameter
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1161, in __call__
return self.main(*args, **kwargs)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1082, in main
rv = self.invoke(ctx)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1443, in invoke
return ctx.invoke(self.callback, **ctx.params)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 788, in invoke
return __callback(*args, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 315, in main
launch_training(c=c, desc=desc, outdir=opts.outdir, dry_run=opts.dry_run)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 93, in launch_training
subprocess_fn(rank=0, c=c, temp_dir=temp_dir)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 44, in subprocess_fn
training_loop.training_loop(rank=rank, **c)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/training/training_loop.py", line 194, in training_loop
img = misc.print_module_summary(G, [z, c])
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/misc.py", line 199, in print_module_summary
outputs = module(*inputs)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/training/networks.py", line 27, in forward
return self.Model(x, c)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 149, in forward
x = Layer(x)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 111, in forward
x = Layer(x)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 44, in forward
y = self.LinearLayer2(self.NonLinearity1(y))
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/FusedOperators.py", line 31, in forward
return bias_act.bias_act(x, self.Bias.to(x.dtype), act=BiasedActivationCUDA.Function, gain=1)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/ops/bias_act.py", line 84, in bias_act
if impl == 'cuda' and x.device.type == 'cuda' and _init():
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/ops/bias_act.py", line 41, in _init
_plugin = custom_ops.get_plugin(
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/custom_ops.py", line 136, in get_plugin
torch.utils.cpp_extension.load(name=module_name, build_directory=cached_build_dir,
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1202, in load
return _jit_compile(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1425, in _jit_compile
_write_ninja_file_and_build_library(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1537, in _write_ninja_file_and_build_library
_run_ninja_build(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1824, in _run_ninja_build
raise RuntimeError(message) from e
RuntimeError: Error building extension 'bias_act_plugin': [1/3] /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/nvcc -ccbin /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/x86_64-conda-linux-gnu-cc -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -D__CUDA_NO_HALF_OPERATORS -D__CUDA_NO_HALF_CONVERSIONS
-D__CUDA_NO_BFLOAT16_CONVERSIONS__
-D__CUDA_NO_HALF2_OPERATORS__
--expt-relaxed-constexpr -gencode=arch=compute_70,code=compute_70 -gencode=arch=compute_70,code=sm_70 --compiler-options '-fPIC' --use_fast_math --allow-unsupported-compiler -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cu -o bias_act.cuda.o
FAILED: bias_act.cuda.o
/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/nvcc -ccbin /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/x86_64-conda-linux-gnu-cc -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -D__CUDA_NO_HALF_OPERATORS -D__CUDA_NO_HALF_CONVERSIONS
-D__CUDA_NO_BFLOAT16_CONVERSIONS__
-D__CUDA_NO_HALF2_OPERATORS__
--expt-relaxed-constexpr -gencode=arch=compute_70,code=compute_70 -gencode=arch=compute_70,code=sm_70 --compiler-options '-fPIC' --use_fast_math --allow-unsupported-compiler -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cu -o bias_act.cuda.o
x86_64-conda-linux-gnu-cc: fatal error: cannot execute 'cc1plus': execvp: No such file or directory
compilation terminated.
nvcc fatal : Failed to preprocess host compiler properties.
[2/3] c++ -MMD -MF bias_act.o.d -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="_gcc" -DPYBIND11_STDLIB="_libstdcpp" -DPYBIND11_BUILD_ABI="_cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -fPIC -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp -o bias_act.o
FAILED: bias_act.o
c++ -MMD -MF bias_act.o.d -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="_gcc" -DPYBIND11_STDLIB="_libstdcpp" -DPYBIND11_BUILD_ABI="_cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -fPIC -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp -o bias_act.o
In file included from /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp:10:
/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/ATen/cuda/CUDAContext.h:5:10: fatal error: cuda_runtime_api.h: No such file or directory
#include <cuda_runtime_api.h>
^~~~~~~~~~~~~~~~~~~~
compilation terminated.
ninja: build stopped: subcommand failed.

Metadata

Metadata

Assignees

No one assigned

    Labels

    No labels
    No labels

    Type

    No type

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions