-
Notifications
You must be signed in to change notification settings - Fork 10
Description
Using /root/.cache/torch_extensions/py38_cu117 as PyTorch extensions root...
Detected CUDA files, patching ldflags
Emitting ninja build file /root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/build.ninja...
Building extension module custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem...
Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N)
[1/3] c++ -MMD -MF main.o.d -DTORCH_EXTENSION_NAME=custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1013" -isystem /opt/conda/lib/python3.8/site-packages/torch/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/torch/csrc/api/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/TH -isystem /opt/conda/lib/python3.8/site-packages/torch/include/THC -isystem /usr/local/cuda/include -isystem /opt/conda/include/python3.8 -D_GLIBCXX_USE_CXX11_ABI=1 -fPIC -std=c++14 -c /root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/main.cpp -o main.o
[2/3] /usr/local/cuda/bin/nvcc -DTORCH_EXTENSION_NAME=custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1013" -isystem /opt/conda/lib/python3.8/site-packages/torch/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/torch/csrc/api/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/TH -isystem /opt/conda/lib/python3.8/site-packages/torch/include/THC -isystem /usr/local/cuda/include -isystem /opt/conda/include/python3.8 -D_GLIBCXX_USE_CXX11_ABI=1 -D__CUDA_NO_HALF_OPERATORS__ -D__CUDA_NO_HALF_CONVERSIONS__ -D__CUDA_NO_BFLOAT16_CONVERSIONS__ -D__CUDA_NO_HALF2_OPERATORS__ --expt-relaxed-constexpr -gencode=arch=compute_52,code=sm_52 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_61,code=sm_61 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_86,code=compute_86 -gencode=arch=compute_86,code=sm_86 --compiler-options '-fPIC' -arch=sm_70 --use_fast_math -std=c++17 -c /root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu -o cuda.cuda.o
FAILED: cuda.cuda.o
/usr/local/cuda/bin/nvcc -DTORCH_EXTENSION_NAME=custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE="gcc" -DPYBIND11_STDLIB="libstdcpp" -DPYBIND11_BUILD_ABI="cxxabi1013" -isystem /opt/conda/lib/python3.8/site-packages/torch/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/torch/csrc/api/include -isystem /opt/conda/lib/python3.8/site-packages/torch/include/TH -isystem /opt/conda/lib/python3.8/site-packages/torch/include/THC -isystem /usr/local/cuda/include -isystem /opt/conda/include/python3.8 -D_GLIBCXX_USE_CXX11_ABI=1 -D__CUDA_NO_HALF_OPERATORS__ -D__CUDA_NO_HALF_CONVERSIONS__ -D__CUDA_NO_BFLOAT16_CONVERSIONS__ -D__CUDA_NO_HALF2_OPERATORS__ --expt-relaxed-constexpr -gencode=arch=compute_52,code=sm_52 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_61,code=sm_61 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_86,code=compute_86 -gencode=arch=compute_86,code=sm_86 --compiler-options '-fPIC' -arch=sm_70 --use_fast_math -std=c++17 -c /root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu -o cuda.cuda.o
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(10): error: name must be a namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(84): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(84): error: type name is not allowed
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(84): error: identifier "acc_frag" is undefined
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(87): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(374): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(374): error: type name is not allowed
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(374): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(374): error: identifier "a_frag" is undefined
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(375): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(377): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(377): error: type name is not allowed
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(377): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(377): error: identifier "b_frag_inner_pipe" is undefined
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(381): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(392): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(395): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(405): error: name followed by "::" must be a class or namespace name
/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu(405): error: name followed by "::" must be a class or namespace name
19 errors detected in the compilation of "/root/.cache/torch_extensions/py38_cu117/custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem/cuda.cu".
ninja: build stopped: subcommand failed.
Traceback (most recent call last):
File "/opt/conda/lib/python3.8/site-packages/torch/utils/cpp_extension.py", line 1869, in _run_ninja_build
subprocess.run(
File "/opt/conda/lib/python3.8/subprocess.py", line 516, in run
raise CalledProcessError(retcode, process.args,
subprocess.CalledProcessError: Command '['ninja', '-v']' returned non-zero exit status 1.
The above exception was the direct cause of the following exception:
Traceback (most recent call last):
File "good_kernels/cuda_evaluator.py", line 19, in <module>
from good_kernels.Conv2D.src import ModelNew as CudaModel
File "/workspace/alpha_evolve/good_kernels/Conv2D/src.py", line 521, in <module>
custom_conv2d_wmma_ops = load_inline(
File "/opt/conda/lib/python3.8/site-packages/torch/utils/cpp_extension.py", line 1406, in load_inline
return _jit_compile(
File "/opt/conda/lib/python3.8/site-packages/torch/utils/cpp_extension.py", line 1480, in _jit_compile
_write_ninja_file_and_build_library(
File "/opt/conda/lib/python3.8/site-packages/torch/utils/cpp_extension.py", line 1594, in _write_ninja_file_and_build_library
_run_ninja_build(
File "/opt/conda/lib/python3.8/site-packages/torch/utils/cpp_extension.py", line 1885, in _run_ninja_build
raise RuntimeError(message) from e
RuntimeError: Error building extension 'custom_conv2d_wmma_ops_optimized_k_pipe_vec_smem'