# ############################################################################# # Copyright (c) 2016 - present Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal # in the Software without restriction, including without limitation the rights # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell # copies of the Software, and to permit persons to whom the Software is # furnished to do so, subject to the following conditions: # # The above copyright notice and this permission notice shall be included in # all copies or substantial portions of the Software. # # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN # THE SOFTWARE. # ############################################################################# # ######################################################################## # A helper function to prefix a source list of files with a common path into a new list (non-destructive) # ######################################################################## function( prepend_path prefix source_list_of_files return_list_of_files ) foreach( file ${${source_list_of_files}} ) if(IS_ABSOLUTE ${file} ) list( APPEND new_list ${file} ) else( ) list( APPEND new_list ${prefix}/${file} ) endif( ) endforeach( ) set( ${return_list_of_files} ${new_list} PARENT_SCOPE ) endfunction( ) # ######################################################################## # Main # ######################################################################## # This builds the generator executable add_subdirectory( generator ) # This includes an explicit list (all possible) of files the generator currently outputs include( generator/generated-kernels.cmake ) set( generator_pattern all CACHE STRING "FFT kernels to generate" ) set_property( CACHE generator_pattern PROPERTY STRINGS pow2 pow3 pow5 "pow2,3" "pow2,5" "pow3,5" all ) set( gen_headers ${kernels_launch} ${kernels_all} ) if( generator_pattern STREQUAL "pow2" ) set( gen_headers ${kernels_launch} ${kernels_pow2} ) elseif( generator_pattern STREQUAL "pow3" ) set( gen_headers ${kernels_launch} ${kernels_pow3} ) elseif( generator_pattern STREQUAL "pow5" ) set( gen_headers ${kernels_launch} ${kernels_pow5} ) endif() # add_custom_command will create source output files, that are used in a target below # In order for the dependencies to work in cmake, add_custom_command must be in the same # CMakeLists.txt file as the target [rocfft-device] add_custom_command( OUTPUT ${gen_headers} COMMAND rocfft-kernel-generator ${generator_pattern} ${small_kernels_group_num} DEPENDS rocfft-kernel-generator # WORKING_DIRECTORY ${kernel_path} COMMENT "Generator producing device kernels for rocfft-device" ) # The following is a list of implementation files defining the library set( rocfft_device_source transpose.cpp bluestein.cpp real2complex.cpp complex2real.cpp ) prepend_path( "../.." rocfft_headers_public relative_rocfft_device_headers_public ) add_library( rocfft-device ${rocfft_device_source} ${relative_rocfft_device_headers_public} ${gen_headers} ) add_library( roc::rocfft-device ALIAS rocfft-device ) target_compile_features( rocfft-device PRIVATE cxx_static_assert cxx_nullptr cxx_auto_type ) target_compile_options (rocfft-device PRIVATE -fno-gpu-rdc) # Remove this check when we no longer build with older rocm stack(ie < 1.8.2) if(TARGET hip::device) target_link_libraries( rocfft-device PRIVATE hip::device ) else() target_link_libraries( rocfft-device PRIVATE hip::hip_hcc hip::hip_device hcc::hccshared ) endif() if(HIP_PLATFORM STREQUAL "nvcc") target_compile_options( rocfft-device PRIVATE "-gencode arch=compute_50,code=sm_50 -gencode arch=compute_52,code=sm_52 -gencode arch=compute_30,code=sm_30" ) endif() if( CMAKE_CXX_COMPILER MATCHES ".*/hcc$" OR HIP_PLATFORM STREQUAL "hip-clang") # Remove following when hcc is fixed; hcc emits following spurious warning ROCm v1.6.1 # "clang-5.0: warning: argument unused during compilation: '-isystem /opt/rocm/include'" target_compile_options( rocfft-device PRIVATE -Wno-unused-command-line-argument ) foreach( target ${AMDGPU_TARGETS} ) target_link_libraries( rocfft-device PRIVATE --amdgpu-target=${target} ) endforeach( ) endif( ) target_include_directories( rocfft-device PRIVATE $ $ $ $ $ $ $ ) rocm_set_soversion( rocfft-device ${rocfft_SOVERSION} ) set_target_properties( rocfft-device PROPERTIES CXX_EXTENSIONS NO ) set_target_properties( rocfft-device PROPERTIES RUNTIME_OUTPUT_DIRECTORY "${PROJECT_BINARY_DIR}/staging" ) set_target_properties( rocfft-device PROPERTIES DEBUG_POSTFIX "-d" ) set_target_properties( rocfft-device PROPERTIES CXX_STANDARD 14 CXX_STANDARD_REQUIRED ON ) # Following Boost conventions of prefixing 'lib' on static built libraries, across all platforms if( NOT BUILD_SHARED_LIBS ) set_target_properties( rocfft-device PROPERTIES PREFIX "lib" ) endif( ) rocm_install_targets( TARGETS rocfft-device PREFIX rocfft ) # PERMISSIONS OWNER_EXECUTE OWNER_WRITE OWNER_READ GROUP_EXECUTE GROUP_READ WORLD_EXECUTE WORLD_READ rocm_install_symlink_subdir( rocfft )