Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- [50/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_casual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [51/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_casual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [52/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_bf16_noncasual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [53/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_gqa_fp16_noncasual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [54/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_casual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [55/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_noncasual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [56/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_fp16_casual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [57/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/flash_api_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/flash_api_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/flash_api_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/flash_api_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/flash_api_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/flash_api_hip.hip:14:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/flash_api_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/flash_api_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- [58/58] /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- FAILED: /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.o
- /opt/rocm-6.3.4/bin/hipcc -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.hip -o /tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.o -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ --offload-arch=native -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1016"' -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.hip:25:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_runner_hip.hpp:30:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_invoker_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/fwd_device_gemm_template_hip.hpp:27:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/device_gemm_trait_hip.hpp:45:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_operation/gpu/device/impl/device_grouped_query_attention_forward_wmma_hip.hpp:17:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/tensor_description/tensor_descriptor_hip.hpp:7:
- In file included from /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/common_header_hip.hpp:37:
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:32:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 32 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include/ck/utility/amd_buffer_addressing.hpp:47:48: error: use of undeclared identifier 'CK_BUFFER_RESOURCE_3RD_DWORD'
- 47 | wave_buffer_resource.config(Number<3>{}) = CK_BUFFER_RESOURCE_3RD_DWORD;
- | ^
- 2 errors generated when compiling for gfx1036.
- failed to execute:/opt/rocm-6.3.4/lib/llvm/bin/clang++ --offload-arch=native -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/include -I/tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/composable_kernel/library/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/torch/csrc/api/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/include/THH -I/opt/rocm-6.3.4/include -I/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/include -I/usr/include/python3.12 -c -c -x hip /tmp/pip-req-build-jdvqq1lu/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.hip -o "/tmp/pip-req-build-jdvqq1lu/build/temp.linux-x86_64-cpython-312/csrc/flash_attn_rocm/src/flash_fwd_runner_batched_mqa_bf16_noncasual_gfx110x_hip.o" -D__HIP_PLATFORM_AMD__=1 -DUSE_ROCM=1 -DHIPBLAS_V2 -fPIC -DCUDA_HAS_FP16=1 -D__HIP_NO_HALF_OPERATORS__=1 -D__HIP_NO_HALF_CONVERSIONS__=1 -DHIP_ENABLE_WARP_SYNC_BUILTINS=1 -O3 -std=c++17 -DNDEBUG -U__HIP_NO_HALF_OPERATORS__ -U__HIP_NO_HALF_CONVERSIONS__ -D__WMMA__ -DTORCH_API_INCLUDE_EXTENSION_H -DPYBIND11_COMPILER_TYPE=\"_gcc\" -DPYBIND11_STDLIB=\"_libstdcpp\" -DPYBIND11_BUILD_ABI=\"_cxxabi1016\" -DTORCH_EXTENSION_NAME=flash_attn_2_cuda -fno-gpu-rdc
- ninja: build stopped: subcommand failed.
- Traceback (most recent call last):
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/utils/cpp_extension.py", line 2560, in _run_ninja_build
- subprocess.run(
- File "/usr/lib/python3.12/subprocess.py", line 571, in run
- raise CalledProcessError(retcode, process.args,
- subprocess.CalledProcessError: Command '['ninja', '-v']' returned non-zero exit status 1.
- The above exception was the direct cause of the following exception:
- Traceback (most recent call last):
- File "<string>", line 2, in <module>
- File "<pip-setuptools-caller>", line 35, in <module>
- File "/tmp/pip-req-build-jdvqq1lu/setup.py", line 380, in <module>
- setup(
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/__init__.py", line 103, in setup
- return distutils.core.setup(**attrs)
- ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/core.py", line 184, in setup
- return run_commands(dist)
- ^^^^^^^^^^^^^^^^^^
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/core.py", line 200, in run_commands
- dist.run_commands()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/dist.py", line 970, in run_commands
- self.run_command(cmd)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/dist.py", line 974, in run_command
- super().run_command(command)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/dist.py", line 989, in run_command
- cmd_obj.run()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/command/bdist_wheel.py", line 373, in run
- self.run_command("build")
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/cmd.py", line 316, in run_command
- self.distribution.run_command(command)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/dist.py", line 974, in run_command
- super().run_command(command)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/dist.py", line 989, in run_command
- cmd_obj.run()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/command/build.py", line 135, in run
- self.run_command(cmd_name)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/cmd.py", line 316, in run_command
- self.distribution.run_command(command)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/dist.py", line 974, in run_command
- super().run_command(command)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/dist.py", line 989, in run_command
- cmd_obj.run()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/command/build_ext.py", line 93, in run
- _build_ext.run(self)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/command/build_ext.py", line 359, in run
- self.build_extensions()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/utils/cpp_extension.py", line 1056, in build_extensions
- build_ext.build_extensions(self)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/command/build_ext.py", line 479, in build_extensions
- self._build_extensions_serial()
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/command/build_ext.py", line 505, in _build_extensions_serial
- self.build_extension(ext)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/command/build_ext.py", line 254, in build_extension
- _build_ext.build_extension(self, ext)
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/setuptools/_distutils/command/build_ext.py", line 560, in build_extension
- objects = self.compiler.compile(
- ^^^^^^^^^^^^^^^^^^^^^^
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/utils/cpp_extension.py", line 840, in unix_wrap_ninja_compile
- _write_ninja_file_and_compile_objects(
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/utils/cpp_extension.py", line 2213, in _write_ninja_file_and_compile_objects
- _run_ninja_build(
- File "/home/andrew/Downloads/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.12/site-packages/torch/utils/cpp_extension.py", line 2577, in _run_ninja_build
- raise RuntimeError(message) from e
- RuntimeError: Error compiling objects for extension
- [end of output]
- note: This error originates from a subprocess, and is likely not a problem with pip.
- ERROR: Failed building wheel for flash_attn
- Running setup.py clean for flash_attn
- Failed to build flash_attn
- ERROR: Failed to build installable wheels for some pyproject.toml based projects (flash_attn)
Advertisement
Add Comment
Please, Sign In to add comment