Select Git revision
opt_mesh.texi
Forked from
gmsh / gmsh
Source project has a limited visibility.
CMakeLists.txt 12.74 KiB
# This is GMSH/DG, a GPU-Accelerated Nodal Discontinuous Galerkin
# solver for Conservation Laws.
#
# Copyright (C) 2020-2022 Matteo Cicuttin - University of Liège
#
# This code is released under GNU AGPLv3 license, see LICENSE.txt for details.
cmake_minimum_required(VERSION 3.18)
project(gmsh_gpu_dg)
include(CheckLanguage)
set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED ON)
set(CMAKE_CUDA_ARCHITECTURES 35 70)
set(CMAKE_HIP_ARCHITECTURES gfx803 gfx908) # rocm_agent_enumerator
# Additional modules path for cmake
set (CMAKE_MODULE_PATH
${CMAKE_MODULE_PATH}
${CMAKE_CURRENT_SOURCE_DIR}/cmake)
set(CXX_LANGUAGE_FEATURES_TESTS_DIR "${CMAKE_CURRENT_SOURCE_DIR}/cmake")
if(NOT DEFINED HIP_PATH)
if(NOT DEFINED ENV{HIP_PATH})
set(HIP_PATH "/opt/rocm/hip" CACHE PATH "Path to which HIP has been installed")
else()
set(HIP_PATH $ENV{HIP_PATH} CACHE PATH "Path to which HIP has been installed")
endif()
endif()
set(CMAKE_MODULE_PATH "${HIP_PATH}/cmake" ${CMAKE_MODULE_PATH})
try_compile(CXX_FEATURE_STD_FILESYSTEM ${CMAKE_BINARY_DIR} "${CXX_LANGUAGE_FEATURES_TESTS_DIR}/check_std_filesystem.cpp")
if (NOT CXX_FEATURE_STD_FILESYSTEM)
add_definitions(-DDONT_USE_STD_FILESYSTEM)
endif()
if (CMAKE_CXX_COMPILER_ID STREQUAL "AppleClang")
cmake_host_system_information(RESULT OSVER QUERY OS_RELEASE)
if (OSVER VERSION_LESS "10.15")
add_definitions(-DDONT_USE_STD_FILESYSTEM)
endif()
endif()
######################################################################
## Find required libraries: Eigen3
find_package(Eigen3 REQUIRED)
set(LINK_LIBS ${LINK_LIBS} Eigen3::Eigen)
######################################################################
## Find required libraries: GMSH
find_package(GMSH REQUIRED)
set(LINK_LIBS ${LINK_LIBS} GMSH)
file(STRINGS ${GMSH_INCLUDE_DIR}/gmsh.h GMSH_API_VERSION_STR REGEX "#define GMSH_API_VERSION .*")
string(REGEX MATCH "[\.0-9]+" GMSH_API_VERSION "${GMSH_API_VERSION_STR}")
if(GMSH_API_VERSION VERSION_LESS "4.9.0")
add_definitions(-DUSE_INITIAL_4_8_4_API)
endif()
######################################################################
## Find required libraries: SILO
find_package(SILO REQUIRED)
set(LINK_LIBS ${LINK_LIBS} SILO)
option(OPT_SILO_USE_HDF5 "Use HDF5 driver for silo files" ON)
if (OPT_SILO_USE_HDF5)
add_definitions(-DSILO_USE_HDF5)
endif()
######################################################################
## Find required libraries: Lua
find_package(Lua REQUIRED)
include_directories("${LUA_INCLUDE_DIR}")
set(LINK_LIBS ${LINK_LIBS} ${LUA_LIBRARIES})
set(SOL2_BUILD_LUA OFF CACHE BOOL "Override sol2 build lua option")
add_subdirectory(contrib/sol2)
include_directories(contrib/sol2/include)
######################################################################
## Find optional libraries: MPI
option(OPT_USE_MPI "Use MPI if available" OFF)
find_package(MPI)
if (OPT_USE_MPI AND MPI_FOUND)
add_definitions(-DUSE_MPI)
# Ugly hack for Lumi
if (DEFINED ENV{CRAY_MPICH_ROOTDIR})
include_directories("$ENV{MPICH_DIR}/include")
link_directories("$ENV{MPICH_DIR}/lib")
link_directories("$ENV{CRAY_MPICH_ROOTDIR}/gtl/lib")
set(LINK_LIBS ${LINK_LIBS} -lmpi_gtl_hsa)
else()
include_directories("${MPI_CXX_INCLUDE_DIRS}")
set(LINK_LIBS ${LINK_LIBS} ${MPI_CXX_LIBRARIES})
endif()
endif()
######################################################################
## Use or not use GPU solvers
option(OPT_CUDA_USE_CXX14 "Use C++14 (only for rhum compat)" OFF)
option(OPT_ENABLE_GPU_SOLVER "Enable GPU solvers" OFF)
if (OPT_ENABLE_GPU_SOLVER)
add_definitions(-DENABLE_GPU_SOLVER)
######################################################################
## CUDA stuff, find toolkit, compiler & NVML
find_package(CUDAToolkit)
if (CUDAToolkit_FOUND)
set(CMAKE_CUDA_COMPILER ${CUDAToolkit_NVCC_EXECUTABLE})
enable_language(CUDA)
if (OPT_CUDA_USE_CXX14)
set(CMAKE_CUDA_STANDARD 14)
else()
set(CMAKE_CUDA_STANDARD 17)
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Wno-cpp")
endif()
set(CMAKE_CUDA_STANDARD_REQUIRED TRUE)
#set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -lineinfo --resource-usage -Xptxas -dlcm=ca")
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -lineinfo -prec-div=true \
-Xptxas -warn-spills -Xptxas -lineinfo -Xptxas -warn-lmem-usage")
option(OPT_PTXAS_SHOW_RUSAGE "Enable PTXAS resource usage reporting")
if (OPT_PTXAS_SHOW_RUSAGE)
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --resource-usage")
endif()
if (TARGET CUDA::cudart)
set(HAVE_CUDA TRUE)
set(LINK_LIBS ${LINK_LIBS} CUDA::cudart)
add_definitions(-DHAVE_CUDA)
endif()
option(OPT_USE_CUDA_NVML "Enable NVML" ON)
if (OPT_USE_CUDA_NVML AND TARGET CUDA::nvml)
set(HAVE_CUDA_NVML TRUE)
set(LINK_LIBS ${LINK_LIBS} CUDA::nvml)
add_definitions(-DHAVE_CUDA_NVML)
endif()
link_directories("/usr/local/cuda/lib64")
endif()
######################################################################
## Find HIP stuff
find_package(HIP QUIET MODULE)
if (HIP_FOUND)
add_definitions(-DHAVE_HIP)
include_directories("${HIP_PATH}/include")
set(CMAKE_HIP_LINK_EXECUTABLE "${HIP_HIPCC_CMAKE_LINKER_HELPER} ${HCC_HOME} <FLAGS> <CMAKE_CXX_LINK_FLAGS> <LINK_FLAGS> <OBJECTS> -o <TARGET> <LINK_LIBRARIES>")
if (DEFINED ENV{HIP_PLATFORM})
if ($ENV{HIP_PLATFORM} STREQUAL "nvcc")
#set(HIP_NVCC_FLAGS "-ccbin g++-7" ${HIP_NVCC_FLAGS})
set(CMAKE_HIP_LINK_EXECUTABLE "${CUDAToolkit_NVCC_EXECUTABLE} <FLAGS> <CMAKE_CXX_LINK_FLAGS> <LINK_FLAGS> <OBJECTS> -o <TARGET> <LINK_LIBRARIES>")
endif()
endif()
option(OPT_USE_HIP "Use HIP GPU code path" OFF)
if (OPT_USE_HIP)
add_definitions(-DGPU_USE_HIP)
add_definitions(-D__HIP_PLATFORM_HCC__)
set(LINK_LIBS ${LINK_LIBS})
endif()
endif()
endif()
if (OPT_ENABLE_GPU_SOLVER)
option(OPT_DEBUG_GPU "Enable GPU debugging" OFF)
if (OPT_DEBUG_GPU)
add_definitions(-DCUDA_DEBUG)
add_definitions(-DGPU_DEBUG)
endif()
endif()
######################################################################
## Compiler identification stuff
if (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
set(COMPILER_IS_CLANG TRUE)
elseif (CMAKE_CXX_COMPILER_ID STREQUAL "GNU")
set(COMPILER_IS_GNU TRUE)
elseif (CMAKE_CXX_COMPILER_ID STREQUAL "Intel")
set(COMPILER_IS_INTEL TRUE)
endif ()
######################################################################
## Compiler optimization options
if (COMPILER_IS_CLANG)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -Weverything -Wno-c++98-compat \
-Wno-c++98-compat-pedantic -Wno-zero-as-null-pointer-constant -Wno-global-constructors \
-Wno-padded -Wno-shorten-64-to-32 -Wno-sign-conversion -Wno-old-style-cast \
-Wno-sign-compare -Wno-c99-extensions -Wno-extra-semi-stmt -Wno-source-uses-openmp")
else()
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -Wextra -Wno-sign-compare -Wshadow \
-Wno-unknown-pragmas -Wno-unused-parameter")
endif()
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fpermissive")
set(CMAKE_CXX_FLAGS_DEBUG "-O0 -g -fsanitize=address")
set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS_RELWITHDEBINFO}")
set(CMAKE_CXX_FLAGS_RELEASE "-O3 -g -DNDEBUG")
set(CMAKE_CXX_FLAGS_RELEASEASSERT "-O3 -g")
option(OPT_ENABLE_OPENMP "Enable OpenMP parallelization" OFF)
if (OPT_ENABLE_OPENMP)
find_package(OpenMP)
if (OpenMP_FOUND)
set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${OpenMP_C_FLAGS}")
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${OpenMP_CXX_FLAGS}")
endif()
endif()
if (COMPILER_IS_CLANG OR COMPILER_IS_GNU OR COMPILER_IS_INTEL)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -march=native")
endif()
######################################################################
## Optimization stuff
option(OPT_PREFER_512bit "Prefer 512 bit vectors with AVX512 (only Clang > 10 & GCC)" OFF)
if (OPT_PREFER_512bit)
# https://reviews.llvm.org/D67259
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mprefer-vector-width=512")
endif()
option(OPT_AGGRESSIVE_FP "Enable DAZ, FTZ and -ffast-math" ON)
if (OPT_AGGRESSIVE_FP)
add_definitions(-DDISALLOW_DENORMALS)
if (COMPILER_IS_CLANG OR COMPILER_IS_GNU)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -ffast-math")
endif()
endif()
option(OPT_VECTORIZER_REMARKS "Enable vectorizer remarks" OFF)
if (OPT_VECTORIZER_REMARKS)
if (COMPILER_IS_CLANG)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Rpass=loop-vectorize \
-Rpass-missed=loop-vectorize -Rpass-analysis=loop-vectorize")
endif()
if (COMPILER_IS_INTEL)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -qopt-report-phase=vec -qopt-report=2")
endif()
if (COMPILER_IS_GNU)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fopt-info-vec-optimized")
endif()
endif()
option(OPT_MEASURE_PERFORMANCE "Enable performance measurement (produces a ton of output)" OFF)
if (OPT_MEASURE_PERFORMANCE)
add_definitions(-DMEASURE_PERFORMANCE)
endif()
option(OPT_CRASH_ON_NAN "Crash code if NaNs are generated" OFF)
if (OPT_CRASH_ON_NAN)
add_definitions(-DCRASH_ON_NAN)
endif()
######################################################################
## Development & debug stuff
if (COMPILER_IS_CLANG OR COMPILER_IS_GNU)
option(OPT_ASAN "Enable Address Sanitizer" OFF)
if (OPT_ASAN)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsanitize=address")
endif()
endif()
option(OPT_WRITE_TEST_OUTPUTS "Produce SILO files in tests" OFF)
if (OPT_WRITE_TEST_OUTPUTS)
add_definitions(-DWRITE_TEST_OUTPUTS)
endif()
option(OPT_EXPENSIVE_ASSERTS "Enable expensive assert()s" OFF)
if (OPT_EXPENSIVE_ASSERTS)
add_definitions(-DEXPENSIVE_ASSERTS)
endif()
option(TM_NEW_CURLS "Use the new method for computing curls" ON)
if (TM_NEW_CURLS)
add_compile_definitions(TM_NEW_CURLS)
endif()
option(TM_ONESHOT_LIFTING "Use one-shot lifting" ON)
if (TM_ONESHOT_LIFTING)
add_compile_definitions(TM_ONESHOT_LIFTING)
endif()
option(TM_ONESHOT_JUMPS "Use one-shot jumps" ON)
if (TM_ONESHOT_JUMPS)
add_compile_definitions(TM_ONESHOT_JUMPS)
endif()
option(OPT_ENABLE_PROFILING "Enables code profiling" OFF)
if (OPT_ENABLE_PROFILING)
add_compile_definitions(ENABLE_PROFILING)
endif()
######################################################################
## Enable/disable solver modules
option(OPT_DEBUG_PRINT "Print debug information")
if (OPT_DEBUG_PRINT)
add_definitions(-DENABLE_DEBUG_PRINT)
endif()
######################################################################
option(OPT_DISABLE_TEXTURE_CACHE "On ROCm 4.1 texture stuff is broken, disable it" OFF)
if (OPT_DISABLE_TEXTURE_CACHE)
add_definitions(-DDISABLE_TEXTURE_CACHE)
endif()
######################################################################
## Enable code to handle geometric diode simulation for UniUD project
option(OPT_ENABLE_EXP_GEOMETRIC_DIODE "Enable Geometric Diode stuff [EXPERIMENTAL][NO GPU]")
if (OPT_ENABLE_EXP_GEOMETRIC_DIODE)
add_definitions(-DENABLE_EXP_GEOMETRIC_DIODE)
endif()
######################################################################
## Configure targets
include_directories(contrib/sgr)
include_directories(${CMAKE_CURRENT_SOURCE_DIR}/include)
add_subdirectory(src)
########## tests
option(OPT_BUILD_TESTS "Build tests" OFF)
if (OPT_BUILD_TESTS)
add_executable(test_basics tests/test_basics.cpp)
target_link_libraries(test_basics gmshdg ${LINK_LIBS})
add_executable(test_mass tests/test_mass.cpp)
target_link_libraries(test_mass gmshdg ${LINK_LIBS})
add_executable(test_curl tests/test_curl.cpp)
target_link_libraries(test_curl gmshdg ${LINK_LIBS})
add_executable(test_differentiation tests/test_differentiation.cpp)
target_link_libraries(test_differentiation gmshdg ${LINK_LIBS})
add_executable(test_lifting tests/test_lifting.cpp)
target_link_libraries(test_lifting gmshdg ${LINK_LIBS})
if (OPT_ENABLE_GPU_SOLVER)
add_executable(test_curl_gpu tests/test_curl_gpu.cpp)
target_link_libraries(test_curl_gpu gmshdg ${LINK_LIBS})
add_executable(test_differentiation_gpu tests/test_differentiation_gpu.cpp)
target_link_libraries(test_differentiation_gpu gmshdg ${LINK_LIBS})
add_executable(profile_differentiation_gpu tests/profile_differentiation_gpu.cpp)
target_link_libraries(profile_differentiation_gpu gmshdg ${LINK_LIBS})
add_executable(profile_curl_gpu tests/profile_curl_gpu.cpp)
target_link_libraries(profile_curl_gpu gmshdg ${LINK_LIBS})
add_executable(test_lifting_gpu tests/test_lifting_gpu.cpp)
target_link_libraries(test_lifting_gpu gmshdg ${LINK_LIBS})
endif()
endif()