-
Notifications
You must be signed in to change notification settings - Fork 45
Description
Traceback (most recent call last):
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1808, in _run_ninja_build
subprocess.run(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/subprocess.py", line 528, in run
raise CalledProcessError(retcode, process.args,
subprocess.CalledProcessError: Command '['ninja', '-v']' returned non-zero exit status 1.
The above exception was the direct cause of the following exception:
Traceback (most recent call last):
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 320, in <module>
main() # pylint: disable=no-value-for-parameter
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1161, in __call__
return self.main(*args, **kwargs)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1082, in main
rv = self.invoke(ctx)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 1443, in invoke
return ctx.invoke(self.callback, **ctx.params)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/click/core.py", line 788, in invoke
return __callback(*args, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 315, in main
launch_training(c=c, desc=desc, outdir=opts.outdir, dry_run=opts.dry_run)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 93, in launch_training
subprocess_fn(rank=0, c=c, temp_dir=temp_dir)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/train.py", line 44, in subprocess_fn
training_loop.training_loop(rank=rank, **c)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/training/training_loop.py", line 194, in training_loop
img = misc.print_module_summary(G, [z, c])
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/misc.py", line 199, in print_module_summary
outputs = module(*inputs)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/training/networks.py", line 27, in forward
return self.Model(x, c)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 149, in forward
x = Layer(x)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 111, in forward
x = Layer(x)
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/Networks.py", line 44, in forward
y = self.LinearLayer2(self.NonLinearity1(y))
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1148, in _call_impl
result = forward_call(*input, **kwargs)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/R3GAN/FusedOperators.py", line 31, in forward
return bias_act.bias_act(x, self.Bias.to(x.dtype), act=BiasedActivationCUDA.Function, gain=1)
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/ops/bias_act.py", line 84, in bias_act
if impl == 'cuda' and x.device.type == 'cuda' and _init():
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/ops/bias_act.py", line 41, in _init
_plugin = custom_ops.get_plugin(
File "/dssg/home/zn_lzhx/R3GAN_Experiments/torch_utils/custom_ops.py", line 136, in get_plugin
torch.utils.cpp_extension.load(name=module_name, build_directory=cached_build_dir,
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1202, in load
return _jit_compile(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1425, in _jit_compile
_write_ninja_file_and_build_library(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1537, in _write_ninja_file_and_build_library
_run_ninja_build(
File "/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/utils/cpp_extension.py", line 1824, in _run_ninja_build
raise RuntimeError(message) from e
RuntimeError: Error building extension 'bias_act_plugin': [1/3] /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/nvcc -ccbin /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/x86_64-conda-linux-gnu-cc -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -D__CUDA_NO_HALF_OPERATORS -D__CUDA_NO_HALF_CONVERSIONS -D__CUDA_NO_BFLOAT16_CONVERSIONS -D__CUDA_NO_HALF2_OPERATORS --expt-relaxed-constexpr -gencode=arch=compute_70,code=compute_70 -gencode=arch=compute_70,code=sm_70 --compiler-options '-fPIC' --use_fast_math --allow-unsupported-compiler -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cu -o bias_act.cuda.o
FAILED: bias_act.cuda.o
/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/nvcc -ccbin /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/bin/x86_64-conda-linux-gnu-cc -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -D__CUDA_NO_HALF_OPERATORS -D__CUDA_NO_HALF_CONVERSIONS -D__CUDA_NO_BFLOAT16_CONVERSIONS -D__CUDA_NO_HALF2_OPERATORS --expt-relaxed-constexpr -gencode=arch=compute_70,code=compute_70 -gencode=arch=compute_70,code=sm_70 --compiler-options '-fPIC' --use_fast_math --allow-unsupported-compiler -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cu -o bias_act.cuda.o
x86_64-conda-linux-gnu-cc: fatal error: cannot execute 'cc1plus': execvp: No such file or directory
compilation terminated.
nvcc fatal : Failed to preprocess host compiler properties.
[2/3] c++ -MMD -MF bias_act.o.d -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="_gcc" -DPYBIND11_STDLIB="_libstdcpp" -DPYBIND11_BUILD_ABI="_cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -fPIC -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp -o bias_act.o
FAILED: bias_act.o
c++ -MMD -MF bias_act.o.d -DTORCH_EXTENSION_NAME=bias_act_plugin -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="_gcc" -DPYBIND11_STDLIB="_libstdcpp" -DPYBIND11_BUILD_ABI="_cxxabi1011" -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/torch/csrc/api/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/TH -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/THC -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include -isystem /dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/include/python3.9 -D_GLIBCXX_USE_CXX11_ABI=0 -fPIC -std=c++14 -c /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp -o bias_act.o
In file included from /dssg/home/zn_lzhx/.cache/torch_extensions/py39_cu113/bias_act_plugin/923aace9669174ee9624e9f9a8189528-tesla-v100-pcie-32gb/bias_act.cpp:10:
/dssg/apps/lico/ohpc_pub/apps/anaconda3/envs/R3GAN_env/lib/python3.9/site-packages/torch/include/ATen/cuda/CUDAContext.h:5:10: fatal error: cuda_runtime_api.h: No such file or directory
#include <cuda_runtime_api.h>
^~~~~~~~~~~~~~~~~~~~
compilation terminated.
ninja: build stopped: subcommand failed.