|
- if(CMAKE_TOOLCHAIN_FILE)
- set(LIBRARY_OUTPUT_PATH_ROOT ${CMAKE_BINARY_DIR} CACHE PATH "root for library output, set this to change where android libs are compiled to")
- # get absolute path, but get_filename_component ABSOLUTE only refer with source dir, so find_file here :(
- get_filename_component(CMAKE_TOOLCHAIN_FILE_NAME ${CMAKE_TOOLCHAIN_FILE} NAME)
- find_file(CMAKE_TOOLCHAIN_FILE ${CMAKE_TOOLCHAIN_FILE_NAME} PATHS ${CMAKE_SOURCE_DIR} NO_DEFAULT_PATH)
- message(STATUS "CMAKE_TOOLCHAIN_FILE = ${CMAKE_TOOLCHAIN_FILE}")
- endif()
-
- if(NOT DEFINED CMAKE_INSTALL_PREFIX)
- set(CMAKE_INSTALL_PREFIX "${CMAKE_BINARY_DIR}/install" CACHE PATH "Installation Directory")
- endif()
- message(STATUS "CMAKE_INSTALL_PREFIX = ${CMAKE_INSTALL_PREFIX}")
-
- if(NOT DEFINED NCNN_VERSION)
- string(TIMESTAMP NCNN_VERSION "%Y%m%d")
- endif()
-
- set(NCNN_VERSION_MAJOR 1)
- set(NCNN_VERSION_MINOR 0)
- set(NCNN_VERSION_PATCH ${NCNN_VERSION})
- set(NCNN_VERSION_STRING ${NCNN_VERSION_MAJOR}.${NCNN_VERSION_MINOR}.${NCNN_VERSION_PATCH})
- if(APPLE OR IOS)
- # macos / ios only accepts a.b.c.d.e where a=24bit b/c/d/e=10bit
- # 20201228 to 20.12.28
- string(SUBSTRING ${NCNN_VERSION} 2 2 NCNN_VERSION_YEAR)
- string(SUBSTRING ${NCNN_VERSION} 4 2 NCNN_VERSION_MONTH)
- string(SUBSTRING ${NCNN_VERSION} 6 2 NCNN_VERSION_DAY)
- set(NCNN_VERSION_STRING ${NCNN_VERSION_MAJOR}.${NCNN_VERSION_MINOR}.${NCNN_VERSION_YEAR}.${NCNN_VERSION_MONTH}.${NCNN_VERSION_DAY})
- endif()
- message(STATUS "NCNN_VERSION_STRING = ${NCNN_VERSION_STRING}")
-
- cmake_minimum_required(VERSION 2.8.12)
-
- if(NOT CMAKE_BUILD_TYPE)
- set(CMAKE_BUILD_TYPE release CACHE STRING "Choose the type of build" FORCE)
- endif()
-
- if(NOT CMAKE_VERSION VERSION_LESS "3.15")
- # enable CMAKE_MSVC_RUNTIME_LIBRARY
- cmake_policy(SET CMP0091 NEW)
- endif()
-
- if(POLICY CMP0025)
- # reference from https://cmake.org/cmake/help/latest/policy/CMP0025.html
- cmake_policy(SET CMP0025 NEW)
- endif()
-
- project(ncnn)
-
- if(MSVC AND NOT CMAKE_VERSION VERSION_LESS "3.15")
- option(NCNN_BUILD_WITH_STATIC_CRT "Enables use of statically linked CRT for statically linked ncnn" OFF)
- if(NCNN_BUILD_WITH_STATIC_CRT)
- # cmake before version 3.15 not work
- set(CMAKE_MSVC_RUNTIME_LIBRARY "MultiThreaded$<$<CONFIG:Debug>:Debug>")
- endif()
- endif()
-
- option(NCNN_SHARED_LIB "shared library support" OFF)
- option(NCNN_ENABLE_LTO "enable link-time optimization" OFF)
- option(NCNN_OPENMP "openmp support" ON)
- option(NCNN_STDIO "load model from external file" ON)
- option(NCNN_STRING "plain and verbose string" ON)
- option(NCNN_INSTALL_SDK "install ncnn library and headers" ON)
- option(NCNN_SIMPLEOCV "minimal opencv structure emulation" OFF)
- option(NCNN_SIMPLEOMP "minimal openmp runtime emulation" OFF)
- option(NCNN_SIMPLESTL "minimal cpp stl structure emulation" OFF)
- option(NCNN_THREADS "build with threads" ON)
- option(NCNN_BENCHMARK "print benchmark information for every layer" OFF)
- option(NCNN_C_API "build with C api" ON)
- option(NCNN_PLATFORM_API "build with platform api candy" ON)
- option(NCNN_PIXEL "convert and resize from/to image pixel" ON)
- option(NCNN_PIXEL_ROTATE "rotate image pixel orientation" ON)
- option(NCNN_PIXEL_AFFINE "warp affine image pixel" ON)
- option(NCNN_PIXEL_DRAWING "draw basic figure and text" ON)
- option(NCNN_CMAKE_VERBOSE "print verbose cmake messages" OFF)
- option(NCNN_VULKAN "vulkan compute support" OFF)
- option(NCNN_SYSTEM_GLSLANG "use system glslang library" OFF)
- option(NCNN_RUNTIME_CPU "runtime dispatch cpu routines" ON)
- option(NCNN_DISABLE_PIC "disable position-independent code" OFF)
- option(NCNN_BUILD_TESTS "build tests" OFF)
- option(NCNN_COVERAGE "build for coverage" OFF)
- option(NCNN_ASAN "build for address sanitizer" OFF)
- option(NCNN_BUILD_BENCHMARK "build benchmark" ON)
- option(NCNN_PYTHON "build python api" OFF)
- option(NCNN_INT8 "int8 inference" ON)
- option(NCNN_BF16 "bf16 inference" ON)
- option(NCNN_FORCE_INLINE "force inline some function" ON)
-
- if(ANDROID OR IOS OR NCNN_SIMPLESTL OR CMAKE_CROSSCOMPILING)
- option(NCNN_DISABLE_RTTI "disable rtti" ON)
- option(NCNN_BUILD_TOOLS "build tools" OFF)
- option(NCNN_BUILD_EXAMPLES "build examples" OFF)
- else()
- option(NCNN_DISABLE_RTTI "disable rtti" OFF)
- option(NCNN_BUILD_TOOLS "build tools" ON)
- option(NCNN_BUILD_EXAMPLES "build examples" ON)
- endif()
-
- if(ANDROID OR IOS OR LINUX OR NCNN_SIMPLESTL)
- option(NCNN_DISABLE_EXCEPTION "disable exception" ON)
- else()
- option(NCNN_DISABLE_EXCEPTION "disable exception" OFF)
- endif()
-
- if(NCNN_SHARED_LIB)
- if(NCNN_BUILD_TESTS)
- message(WARNING "NCNN_SHARED_LIB must be OFF to build tests! NCNN_BUILD_TESTS will be turned off.")
- set(NCNN_BUILD_TESTS OFF)
- endif()
-
- if(NCNN_ENABLE_LTO)
- # enable global link time optimization
- cmake_policy(SET CMP0069 NEW)
- set(CMAKE_POLICY_DEFAULT_CMP0069 NEW)
- include(CheckIPOSupported)
- check_ipo_supported(RESULT ipo_supported OUTPUT ipo_supported_output)
- if(ipo_supported)
- set(CMAKE_INTERPROCEDURAL_OPTIMIZATION TRUE)
- else()
- message(WARNING "IPO is not supported: ${ipo_supported_output}")
- set(NCNN_ENABLE_LTO OFF)
- endif()
- endif()
- endif()
-
- if(NOT NCNN_STDIO OR NOT NCNN_STRING)
- if(NCNN_BUILD_TOOLS)
- message(WARNING "NCNN_STDIO or NCNN_STRING disabled, NCNN_BUILD_TOOLS will be turned off.")
- set(NCNN_BUILD_TOOLS OFF)
- endif()
- if(NCNN_BUILD_EXAMPLES)
- message(WARNING "NCNN_STDIO or NCNN_STRING disabled, NCNN_BUILD_EXAMPLES will be turned off.")
- set(NCNN_BUILD_EXAMPLES OFF)
- endif()
- if(NCNN_BUILD_BENCHMARK)
- message(WARNING "NCNN_STDIO or NCNN_STRING disabled, NCNN_BUILD_BENCHMARK will be turned off.")
- set(NCNN_BUILD_BENCHMARK OFF)
- endif()
- if(NCNN_BUILD_TESTS)
- message(WARNING "NCNN_STDIO or NCNN_STRING disabled, NCNN_BUILD_TESTS will be turned off.")
- set(NCNN_BUILD_TESTS OFF)
- endif()
- endif()
-
- ##############################################
-
- if((IOS AND CMAKE_OSX_ARCHITECTURES MATCHES "arm")
- OR (APPLE AND CMAKE_OSX_ARCHITECTURES MATCHES "arm64")
- OR (CMAKE_SYSTEM_PROCESSOR MATCHES "^(arm|aarch64)")
- OR ((CMAKE_CXX_COMPILER_ID MATCHES "MSVC" OR (CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND CMAKE_CXX_SIMULATE_ID MATCHES "MSVC" AND CMAKE_CXX_COMPILER_FRONTEND_VARIANT MATCHES "MSVC")) AND (${CMAKE_GENERATOR_PLATFORM} MATCHES "^(arm|arm64)")))
- set(NCNN_TARGET_ARCH arm)
-
- if(NOT (CMAKE_CXX_COMPILER_ID MATCHES "MSVC" OR (CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND CMAKE_CXX_SIMULATE_ID MATCHES "MSVC" AND CMAKE_CXX_COMPILER_FRONTEND_VARIANT MATCHES "MSVC")))
- include(CheckCXXCompilerFlag)
-
- set(CMAKE_REQUIRED_FLAGS "-mfpu=neon-vfpv4")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { float32x4_t _a; float16x4_t _s = vcvt_f16_f32(_a); return 0; }" NCNN_COMPILER_SUPPORT_ARM_VFPV4)
-
- if(NOT NCNN_COMPILER_SUPPORT_ARM_VFPV4)
- set(CMAKE_REQUIRED_FLAGS "-mfpu=neon-vfpv4 -mfp16-format=ieee")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { float32x4_t _a; float16x4_t _s = vcvt_f16_f32(_a); return 0; }" NCNN_COMPILER_SUPPORT_ARM_VFPV4_FP16)
- endif()
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.2-a+fp16")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { float16x8_t _s, _a, _b; _s = vfmaq_f16(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM82_FP16)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.2-a+dotprod")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { int32x4_t _s; int8x16_t _a, _b; _s = vdotq_s32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM82_DOTPROD)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.2-a+fp16fml")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { float32x4_t _s; float16x8_t _a, _b; _s = vfmlalq_low_f16(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM82_FP16FML)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.4-a+bf16")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { float32x4_t _s; bfloat16x8_t _a, _b; _s = vcvt_f32_bf16(vcvt_bf16_f32(vbfmmlaq_f32(_s, _a, _b))); return 0; }" NCNN_COMPILER_SUPPORT_ARM84_BF16)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.4-a+i8mm")
- check_cxx_source_compiles("#include <arm_neon.h>\nint main() { int32x4_t _s; int8x16_t _a, _b; _s = vmmlaq_s32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM84_I8MM)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.6-a+sve")
- check_cxx_source_compiles("#include <arm_sve.h>\nint main() { svfloat16_t _s, _a, _b; svbool_t bp; _s = svmla_f16_z(bp, _s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM86_SVE)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.6-a+sve2")
- check_cxx_source_compiles("#include <arm_sve.h>\nint main() { svint16_t _s; svint8_t _a, _b; _s = svmlslb_s16(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM86_SVE2)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.6-a+sve+bf16")
- check_cxx_source_compiles("#include <arm_sve.h>\nint main() { svfloat32_t _s; svbfloat16_t _a, _b; _s = svbfmmla_f32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM86_SVEBF16)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.6-a+sve+i8mm")
- check_cxx_source_compiles("#include <arm_sve.h>\nint main() { svint32_t _s; svint8_t _a, _b; _s = svmmla_s32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM86_SVEI8MM)
-
- set(CMAKE_REQUIRED_FLAGS "-march=armv8.6-a+sve+f32mm")
- check_cxx_source_compiles("#include <arm_sve.h>\nint main() { svfloat32_t _s, _a, _b; _s = svmmla_f32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_ARM86_SVEF32MM)
-
- unset(CMAKE_REQUIRED_FLAGS)
- endif()
-
- if(NCNN_COMPILER_SUPPORT_ARM_VFPV4 OR NCNN_COMPILER_SUPPORT_ARM_VFPV4_FP16)
- option(NCNN_VFPV4 "optimize armv7 platform with vfpv4" ON)
- else()
- message(WARNING "The compiler does not support arm vfpv4. NCNN_VFPV4 will be OFF.")
- endif()
-
- if(NCNN_COMPILER_SUPPORT_ARM82_FP16)
- option(NCNN_ARM82 "optimize aarch64 platform with armv8.2 fp16" ON)
- if(NCNN_COMPILER_SUPPORT_ARM82_DOTPROD)
- if(NCNN_ARM82)
- option(NCNN_ARM82DOT "optimize aarch64 platform with armv8.2 dotprod" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.2 dotprod. NCNN_ARM82DOT will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM82_FP16FML)
- if(NCNN_ARM82)
- option(NCNN_ARM82FP16FML "optimize aarch64 platform with armv8.2 fp16fml" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.2 fp16fml. NCNN_ARM82FP16FML will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM84_BF16)
- if(NCNN_ARM82DOT AND NCNN_ARM82FP16FML)
- option(NCNN_ARM84BF16 "optimize aarch64 platform with armv8.4 bf16" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.4 bf16. NCNN_ARM86BF16 will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM84_I8MM)
- if(NCNN_ARM82DOT AND NCNN_ARM82FP16FML)
- option(NCNN_ARM84I8MM "optimize aarch64 platform with armv8.4 i8mm" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.4 i8mm. NCNN_ARM84I8MM will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM86_SVE)
- if(NCNN_ARM84BF16 AND NCNN_ARM84I8MM)
- option(NCNN_ARM86SVE "optimize aarch64 platform with armv8.6 sve" ON)
- if(NCNN_COMPILER_SUPPORT_ARM86_SVE2)
- if(NCNN_ARM86SVE)
- option(NCNN_ARM86SVE2 "optimize aarch64 platform with armv8.6 sve2" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.6 sve2. NCNN_ARM86SVE2 will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM86_SVEBF16)
- if(NCNN_ARM86SVE)
- option(NCNN_ARM86SVEBF16 "optimize aarch64 platform with armv8.6 sve bf16" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.6 sve bf16. NCNN_ARM86SVEBF16 will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM86_SVEI8MM)
- if(NCNN_ARM86SVE)
- option(NCNN_ARM86SVEI8MM "optimize aarch64 platform with armv8.6 sve i8mm" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.6 sve i8mm. NCNN_ARM86SVEI8MM will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_ARM86_SVEF32MM)
- if(NCNN_ARM86SVE)
- option(NCNN_ARM86SVEF32MM "optimize aarch64 platform with armv8.6 sve f32mm" ON)
- endif()
- else()
- message(WARNING "The compiler does not support armv8.6 sve f32mm. NCNN_ARM86SVEF32MM will be OFF.")
- endif()
- endif()
- else()
- message(WARNING "The compiler does not support armv8.6 sve. NCNN_ARM86SVE will be OFF.")
- endif()
- else()
- message(WARNING "The compiler does not support armv8.2 fp16. NCNN_ARM82 will be OFF.")
- endif()
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(mips)")
- set(NCNN_TARGET_ARCH mips)
-
- include(CheckCXXCompilerFlag)
-
- check_cxx_compiler_flag("-mmsa" NCNN_COMPILER_SUPPORT_MIPS_MSA)
-
- set(CMAKE_REQUIRED_FLAGS "-mloongson-mmi -I${CMAKE_CURRENT_SOURCE_DIR}/src/layer/mips")
- check_cxx_source_compiles("#include \"loongson_mmi.h\"\nint main() { int16x4_t _a, _b; int32x2_t _s = __mmi_pmaddhw(_a, _b); return 0; }" NCNN_COMPILER_SUPPORT_LOONGSON_MMI)
-
- unset(CMAKE_REQUIRED_FLAGS)
-
- if(NCNN_COMPILER_SUPPORT_MIPS_MSA)
- option(NCNN_MSA "optimize mips platform with msa extension" ON)
- else()
- message(WARNING "The compiler does not support msa extension. NCNN_MSA will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_LOONGSON_MMI)
- option(NCNN_MMI "optimize mips platform with loongson mmi extension" ON)
- else()
- message(WARNING "The compiler does not support loongson mmi extension. NCNN_MMI will be OFF.")
- endif()
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(loongarch64|loongarch32)")
- set(NCNN_TARGET_ARCH loongarch)
-
- include(CheckCXXCompilerFlag)
-
- check_cxx_compiler_flag("-mlsx" NCNN_COMPILER_SUPPORT_LOONGARCH_LSX)
-
- if(NCNN_COMPILER_SUPPORT_LOONGARCH_LSX)
- option(NCNN_LSX "optimize loongarch platform with lsx extension" ON)
- else()
- message(WARNING "The compiler does not support lsx extension. NCNN_LSX will be OFF.")
- endif()
-
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(riscv)")
- set(NCNN_TARGET_ARCH riscv)
-
- include(CheckCXXCompilerFlag)
-
- set(CMAKE_REQUIRED_FLAGS "-march=rv64gcv")
- check_cxx_source_compiles("#include <riscv_vector.h>\nint main() { vfloat32m1_t _s, _w; float _v; size_t vl; _s = vfmacc_vf_f32m1(_s, _v, _w, vl); return 0; }" NCNN_COMPILER_SUPPORT_RVV)
-
- set(CMAKE_REQUIRED_FLAGS "-march=rv64gcv_zfh")
- check_cxx_source_compiles("#include <riscv_vector.h>\nint main() { vfloat16m1_t _s, _w; __fp16 _v; size_t vl; _s = vfmacc_vf_f16m1(_s, _v, _w, vl); return 0; }" NCNN_COMPILER_SUPPORT_RVV_ZFH)
-
- if(NOT NCNN_COMPILER_SUPPORT_RVV_ZFH)
- set(CMAKE_REQUIRED_FLAGS "-march=rv64gcv_zfh_zvfh0p1 -menable-experimental-extensions -D__fp16=_Float16")
- check_cxx_source_compiles("#include <riscv_vector.h>\nint main() { vfloat16m1_t _s, _w; __fp16 _v; size_t vl; _s = vfmacc_vf_f16m1(_s, _v, _w, vl); return 0; }" NCNN_COMPILER_SUPPORT_RVV_ZVFH)
- endif()
-
- unset(CMAKE_REQUIRED_FLAGS)
-
- if(NCNN_COMPILER_SUPPORT_RVV)
- option(NCNN_RVV "optimize risc-v platform with v extension" ON)
- option(NCNN_RVV_CHECK_VFREDSUM "check compilter about support rvv-intrinsic" ON)
- if(NCNN_RVV_CHECK_VFREDSUM)
- include(${CMAKE_CURRENT_SOURCE_DIR}/cmake/ncnn_check_rvv_vfredusum.cmake)
- endif()
- if(NOT (NCNN_COMPILER_SUPPORT_RVV_ZFH OR NCNN_COMPILER_SUPPORT_RVV_ZVFH))
- message(WARNING "The compiler does not support risc-v zfh extension. Upgrading your toolchain is strongly recommended.")
- endif()
- option(NCNN_RVV_CHECK_PLAIN_SEGMENT "check compilter about rvv segment load/store interface" ON)
- if(NCNN_RVV_CHECK_PLAIN_SEGMENT)
- set(CMAKE_REQUIRED_FLAGS "-march=rv64gcv")
- check_cxx_source_compiles("#include <riscv_vector.h>\nint main() { vfloat32m1_t _s, _w; size_t vl; float src[32]={.0f}; vlseg2e32_v_f32m1(&_s, &_w, src, vl); return 0; }" NCNN_COMPILER_USE_RVV_PLAIN_SEG)
- unset(CMAKE_REQUIRED_FLAGS)
- endif()
- if(NOT NCNN_COMPILER_USE_RVV_PLAIN_SEG)
- message(WARNING "The compiler uses tuple types for segment load/store. Upgrading your toolchain is strongly recommended.")
- add_definitions(-D__rvv_tuple)
- endif()
- else()
- message(WARNING "The compiler does not support risc-v v extension. NCNN_RVV will be OFF.")
- endif()
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(powerpc|ppc)")
- set(NCNN_TARGET_ARCH powerpc)
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(xtensa)")
- set(NCNN_TARGET_ARCH xtensa)
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(s390x)")
- set(NCNN_TARGET_ARCH s390x)
- elseif(CMAKE_SYSTEM_PROCESSOR MATCHES "^(sw_64)")
- set(NCNN_TARGET_ARCH sw_64)
- #sw_64 is alpha-like platform
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mieee")
- set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mieee")
- else()
- set(NCNN_TARGET_ARCH x86)
-
- option(NCNN_SSE2 "optimize x86 platform with sse2 extension" ON)
-
- include(CheckCXXCompilerFlag)
- if(CMAKE_CXX_COMPILER_ID MATCHES "MSVC" OR (CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND CMAKE_CXX_SIMULATE_ID MATCHES "MSVC" AND CMAKE_CXX_COMPILER_FRONTEND_VARIANT MATCHES "MSVC"))
- check_cxx_compiler_flag("/arch:AVX" NCNN_COMPILER_SUPPORT_X86_AVX)
- check_cxx_compiler_flag("/arch:AVX" NCNN_COMPILER_SUPPORT_X86_FMA)
- check_cxx_compiler_flag("/arch:AVX" NCNN_COMPILER_SUPPORT_X86_XOP)
- check_cxx_compiler_flag("/arch:AVX" NCNN_COMPILER_SUPPORT_X86_F16C)
- check_cxx_compiler_flag("/arch:AVX2" NCNN_COMPILER_SUPPORT_X86_AVX2)
- check_cxx_compiler_flag("/arch:AVX2" NCNN_COMPILER_SUPPORT_X86_AVX_VNNI)
- check_cxx_compiler_flag("/arch:AVX512" NCNN_COMPILER_SUPPORT_X86_AVX512)
- check_cxx_compiler_flag("/arch:AVX512" NCNN_COMPILER_SUPPORT_X86_AVX512_VNNI)
- if(CMAKE_CXX_COMPILER_VERSION VERSION_LESS 19.16)
- # vs2017+ supports avx512 and vnni
- set(NCNN_COMPILER_SUPPORT_X86_AVX_VNNI OFF)
- set(NCNN_COMPILER_SUPPORT_X86_AVX512 OFF)
- set(NCNN_COMPILER_SUPPORT_X86_AVX512_VNNI OFF)
- endif()
- else()
- check_cxx_compiler_flag("-mavx" NCNN_COMPILER_SUPPORT_X86_AVX)
-
- set(CMAKE_REQUIRED_FLAGS "-mfma -mf16c")
- check_cxx_source_compiles("#include <immintrin.h>\nint main() { __m256 _s, _a, _b; _s = _mm256_fmadd_ps(_a, _b, _s); return 0; }" NCNN_COMPILER_SUPPORT_X86_FMA)
-
- check_cxx_compiler_flag("-mxop" NCNN_COMPILER_SUPPORT_X86_XOP)
- check_cxx_compiler_flag("-mf16c" NCNN_COMPILER_SUPPORT_X86_F16C)
- check_cxx_compiler_flag("-mfma -mf16c -mavx2" NCNN_COMPILER_SUPPORT_X86_AVX2)
- check_cxx_compiler_flag("-mfma -mf16c -mavx512f -mavx512cd -mavx512bw -mavx512dq -mavx512vl" NCNN_COMPILER_SUPPORT_X86_AVX512)
-
- set(CMAKE_REQUIRED_FLAGS "-mfma -mf16c -mavx2 -mavxvnni")
- check_cxx_source_compiles("#include <immintrin.h>\nint main() { __m256i _s, _a, _b; _s = _mm256_dpwssd_epi32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_X86_AVX_VNNI)
-
- set(CMAKE_REQUIRED_FLAGS "-mfma -mf16c -mavx512f -mavx512cd -mavx512bw -mavx512dq -mavx512vl -mavx512vnni")
- check_cxx_source_compiles("#include <immintrin.h>\nint main() { __m512i _s, _a, _b; _s = _mm512_dpwssd_epi32(_s, _a, _b); return 0; }" NCNN_COMPILER_SUPPORT_X86_AVX512_VNNI)
-
- set(CMAKE_REQUIRED_FLAGS "-mfma -mf16c -mavx512f -mavx512cd -mavx512bw -mavx512dq -mavx512vl -mavx512bf16")
- check_cxx_source_compiles("#include <immintrin.h>\nint main() { __m256bh _s; __m512bh _a, _b; _s = _mm512_cvtneps_pbh(_mm512_dpbf16_ps(_mm512_cvtpbh_ps(_s), _a, _b)); return 0; }" NCNN_COMPILER_SUPPORT_X86_AVX512_BF16)
-
- set(CMAKE_REQUIRED_FLAGS "-mfma -mf16c -mavx512f -mavx512cd -mavx512bw -mavx512dq -mavx512vl -mavx512fp16")
- check_cxx_source_compiles("#include <immintrin.h>\nint main() { __m512h _s, _a, _b; _s = _mm512_fmadd_ph(_s, _a, _b); __m512 _s2; _s2 = _mm512_cvtxph_ps(_mm512_cvtxps_ph(_s2)); return 0; }" NCNN_COMPILER_SUPPORT_X86_AVX512_FP16)
-
- unset(CMAKE_REQUIRED_FLAGS)
- endif()
-
- if(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten" AND NCNN_COMPILER_SUPPORT_X86_AVX)
- option(NCNN_AVX "optimize x86 platform with avx extension" ON)
- if(NCNN_COMPILER_SUPPORT_X86_FMA)
- if(NCNN_AVX)
- option(NCNN_FMA "optimize x86 platform with fma extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support fma extension. NCNN_FMA will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_XOP)
- if(NCNN_AVX)
- option(NCNN_XOP "optimize x86 platform with xop extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support xop extension. NCNN_XOP will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_F16C)
- if(NCNN_AVX)
- option(NCNN_F16C "optimize x86 platform with f16c extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support f16c extension. NCNN_F16C will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX2)
- if(NCNN_AVX)
- option(NCNN_AVX2 "optimize x86 platform with avx2 extension" ON)
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX_VNNI)
- if(NCNN_AVX2)
- option(NCNN_AVXVNNI "optimize x86 platform with avx vnni extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support avx vnni extension. NCNN_AVXVNNI will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX512)
- if(NCNN_AVX2)
- option(NCNN_AVX512 "optimize x86 platform with avx512 extension" ON)
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX512_VNNI)
- if(NCNN_AVX512)
- option(NCNN_AVX512VNNI "optimize x86 platform with avx512 vnni extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support avx512 vnni extension. NCNN_AVX512VNNI will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX512_BF16)
- if(NCNN_AVX512)
- option(NCNN_AVX512BF16 "optimize x86 platform with avx512 bf16 extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support avx512 bf16 extension. NCNN_AVX512BF16 will be OFF.")
- endif()
- if(NCNN_COMPILER_SUPPORT_X86_AVX512_FP16)
- if(NCNN_AVX512)
- option(NCNN_AVX512FP16 "optimize x86 platform with avx512 fp16 extension" ON)
- endif()
- else()
- message(WARNING "The compiler does not support avx512 fp16 extension. NCNN_AVX512FP16 will be OFF.")
- endif()
- else()
- message(WARNING "The compiler does not support avx512 extension. NCNN_AVX512 will be OFF.")
- endif()
- else()
- message(WARNING "The compiler does not support avx2 extension. NCNN_AVX2 will be OFF.")
- endif()
- else()
- message(WARNING "The compiler does not support avx extension. NCNN_AVX will be OFF.")
- endif()
- endif()
-
- message(STATUS "Target arch: ${NCNN_TARGET_ARCH}")
-
- ##############################################
-
- # set cmake default folder name
- set_property(GLOBAL PROPERTY USE_FOLDERS ON)
- set_property(GLOBAL PROPERTY PREDEFINED_TARGETS_FOLDER "cmake")
-
- if(CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -s FORCE_FILESYSTEM=1 -s INITIAL_MEMORY=256MB -s EXIT_RUNTIME=1")
- set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -s FORCE_FILESYSTEM=1 -s INITIAL_MEMORY=256MB -s EXIT_RUNTIME=1")
- set(CMAKE_EXECUTBLE_LINKER_FLAGS "${CMAKE_EXECUTBLE_LINKER_FLAGS} -s FORCE_FILESYSTEM=1 -s INITIAL_MEMORY=256MB -s EXIT_RUNTIME=1")
-
- if(NCNN_OPENMP AND NCNN_SIMPLEOMP)
- # TODO better flags for emscripten
- # node --experimental-wasm-threads xxx.js
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -s USE_PTHREADS=1 -s PTHREAD_POOL_SIZE=15")
- set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -s USE_PTHREADS=1 -s PTHREAD_POOL_SIZE=15")
- set(CMAKE_EXECUTBLE_LINKER_FLAGS "${CMAKE_EXECUTBLE_LINKER_FLAGS} -s USE_PTHREADS=1 -s PTHREAD_POOL_SIZE=15")
- endif()
- endif()
-
- if(NCNN_VULKAN)
- if(NCNN_SYSTEM_GLSLANG)
- set(GLSLANG_TARGET_DIR "GLSLANG-NOTFOUND" CACHE PATH "Absolute path to glslangTargets.cmake directory")
- if(NOT GLSLANG_TARGET_DIR AND NOT DEFINED ENV{GLSLANG_TARGET_DIR})
- message(WARNING "GLSLANG_TARGET_DIR must be defined! NCNN_SYSTEM_GLSLANG will be turned off.")
- set(NCNN_SYSTEM_GLSLANG OFF)
- else()
- message(STATUS "Using glslang install located at ${GLSLANG_TARGET_DIR}")
-
- find_package(Threads)
-
- include("${GLSLANG_TARGET_DIR}/OSDependentTargets.cmake")
- include("${GLSLANG_TARGET_DIR}/OGLCompilerTargets.cmake")
- if(EXISTS "${GLSLANG_TARGET_DIR}/HLSLTargets.cmake")
- # hlsl support can be optional
- include("${GLSLANG_TARGET_DIR}/HLSLTargets.cmake")
- endif()
- include("${GLSLANG_TARGET_DIR}/glslangTargets.cmake")
- include("${GLSLANG_TARGET_DIR}/SPIRVTargets.cmake")
-
- if (NOT TARGET glslang OR NOT TARGET SPIRV)
- message(WARNING "glslang or SPIRV target not found! NCNN_SYSTEM_GLSLANG will be turned off.")
- set(NCNN_SYSTEM_GLSLANG OFF)
- endif()
- endif()
- endif()
-
- if(NOT NCNN_SYSTEM_GLSLANG)
- if(NOT EXISTS "${CMAKE_CURRENT_SOURCE_DIR}/glslang/CMakeLists.txt")
- message(FATAL_ERROR "The submodules were not downloaded! Please update submodules with \"git submodule update --init\" and try again.")
- else()
- # glslang requires c++11
- set(CMAKE_CXX_STANDARD 11)
-
- option(BUILD_EXTERNAL "" OFF)
- option(ENABLE_SPVREMAPPER "" OFF)
- option(ENABLE_GLSLANG_BINARIES "" OFF)
- option(ENABLE_HLSL "" OFF)
- option(ENABLE_RTTI "" OFF)
- option(ENABLE_EXCEPTIONS "" OFF)
- option(ENABLE_OPT "" OFF)
- option(ENABLE_PCH "" OFF)
- option(ENABLE_CTEST "" OFF)
- if(NCNN_SHARED_LIB)
- option(SKIP_GLSLANG_INSTALL "" ON)
- endif()
- add_subdirectory(glslang)
- if(NCNN_SHARED_LIB)
- if(CMAKE_CXX_COMPILER_ID MATCHES "GNU" OR (CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND NOT CMAKE_CXX_COMPILER_FRONTEND_VARIANT MATCHES "MSVC"))
- target_compile_options(glslang PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden)
- target_compile_options(OGLCompiler PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden)
- target_compile_options(OSDependent PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden)
- target_compile_options(SPIRV PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden)
- endif()
- if(NCNN_ENABLE_LTO)
- set_target_properties(glslang PROPERTIES INTERPROCEDURAL_OPTIMIZATION ON)
- set_target_properties(OGLCompiler PROPERTIES INTERPROCEDURAL_OPTIMIZATION ON)
- set_target_properties(OSDependent PROPERTIES INTERPROCEDURAL_OPTIMIZATION ON)
- set_target_properties(SPIRV PROPERTIES INTERPROCEDURAL_OPTIMIZATION ON)
- endif()
- endif()
- endif()
- endif()
- endif()
-
- add_subdirectory(src)
- if(NCNN_BUILD_BENCHMARK)
- add_subdirectory(benchmark)
- endif()
- if(NCNN_BUILD_EXAMPLES)
- add_subdirectory(examples)
- endif()
- if(NCNN_BUILD_TOOLS)
- add_subdirectory(tools)
- endif()
- if(NCNN_BUILD_TESTS)
- enable_testing()
- add_subdirectory(tests)
- endif()
- if(NCNN_PYTHON)
- add_subdirectory(python)
- endif()
|