| @@ -50,7 +50,7 @@ option(MGE_WITH_JIT "Build MegEngine with JIT." ON) | |||
| option(MGE_WITH_JIT_MLIR "Build MegEngine with MLIR JIT." OFF) | |||
| option(MGE_WITH_HALIDE "Build MegEngine with Halide JIT" OFF) | |||
| option(MGE_WITH_MIDOUT_PROFILE "Build MegEngine with Midout profile." OFF) | |||
| option(MGE_WITH_MINIMUM_SIZE "Swith off MGE_ENABLE_RTTI、MGE_ENABLE_EXCEPTIONS、MGE_ENABLE_LOGGING and switch on MGE_INFERENCE_ONLY so that compile minimum load_and_run. Take effect only when MGE_BIN_REDUCE was set" OFF) | |||
| option(MGE_WITH_MINIMUM_SIZE "Swith off MGE_ENABLE_RTTI、MGE_ENABLE_EXCEPTIONS、MGE_ENABLE_LOGGING and switch on MGE_INFERENCE_ONLY so that compile minimum load_and_run." OFF) | |||
| option(MGE_ARMV8_2_FEATURE_FP16 "Enable armv8.2-a+fp16 support" OFF) | |||
| option(MGE_DISABLE_FLOAT16 "Disable MegEngine float16 support." OFF) | |||
| option(MGE_WITH_CUDA "Enable MegEngine CUDA support." ON) | |||
| @@ -143,16 +143,32 @@ else() | |||
| set(MGE_WITH_ANY_CUDA_STUB OFF) | |||
| endif() | |||
| if(NOT ${MGE_BIN_REDUCE} STREQUAL "") | |||
| message(STATUS "build with BIN REDUCE") | |||
| if(MGE_WITH_MINIMUM_SIZE) | |||
| set(MGE_ENABLE_RTTI OFF) | |||
| set(MGE_ENABLE_LOGGING OFF) | |||
| set(MGE_ENABLE_EXCEPTIONS OFF) | |||
| set(MGE_INFERENCE_ONLY ON) | |||
| if(MGE_WITH_MIDOUT_PROFILE) | |||
| message(STATUS "build with MIDOUT PROFILE and force set MGE_WITH_MINIMUM_SIZE off and force rtti ON") | |||
| set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DMIDOUT_PROFILING") | |||
| set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DMIDOUT_PROFILING") | |||
| set(MGE_WITH_MINIMUM_SIZE OFF) | |||
| set(MGE_ENABLE_RTTI ON) | |||
| if(WIN32) | |||
| message(FATAL_ERROR "do not support midout at WIN32") | |||
| endif() | |||
| set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -include ${MGE_BIN_REDUCE}") | |||
| set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -include ${MGE_BIN_REDUCE}") | |||
| endif() | |||
| set(BIN_REDUCE ${PROJECT_SOURCE_DIR}/src/bin_reduce_cmake.h) | |||
| if(MGE_WITH_MINIMUM_SIZE) | |||
| message(STATUS "build with MGE_WITH_MINIMUM_SIZE bin_reduce header is: ${BIN_REDUCE}") | |||
| set(MGE_ENABLE_RTTI OFF) | |||
| set(MGE_ENABLE_LOGGING OFF) | |||
| set(MGE_ENABLE_EXCEPTIONS OFF) | |||
| set(MGE_INFERENCE_ONLY ON) | |||
| # MGE_WITH_MINIMUM_SIZE will triger unused-parameter | |||
| set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-unused-parameter") | |||
| set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -Wno-unused-parameter") | |||
| endif() | |||
| if(NOT MGE_WITH_MIDOUT_PROFILE AND NOT WIN32) | |||
| set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -include ${BIN_REDUCE}") | |||
| set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -include ${BIN_REDUCE}") | |||
| endif() | |||
| if (NOT APPLE) | |||
| @@ -176,12 +192,6 @@ else() | |||
| message(STATUS "lto is not supported in this compiler") | |||
| endif() | |||
| if(MGE_WITH_MIDOUT_PROFILE) | |||
| message(STATUS "build with MIDOUT PROFILE") | |||
| set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DMIDOUT_PROFILING") | |||
| set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DMIDOUT_PROFILING") | |||
| endif() | |||
| if (APPLE) | |||
| set (BUILD_SHARED_LIBS OFF) | |||
| message(STATUS "build static for xcode framework require") | |||
| @@ -253,9 +263,9 @@ if(NOT CMAKE_CONFIGURATION_TYPES AND NOT CMAKE_BUILD_TYPE) | |||
| set(CMAKE_BUILD_TYPE RelWithDebInfo) | |||
| endif() | |||
| if(${CMAKE_BUILD_TYPE} STREQUAL "Release" AND NOT MGE_WITH_TEST AND NOT ${MGE_ARCH} STREQUAL "x86_64") | |||
| if(${CMAKE_BUILD_TYPE} STREQUAL "Release" AND NOT MGE_WITH_TEST AND NOT ${MGE_ARCH} STREQUAL "x86_64" AND NOT MGE_WITH_MIDOUT_PROFILE) | |||
| set(MGE_ENABLE_RTTI OFF) | |||
| message(STATUS "disable MGE_ENABLE_RTTI when Release/NON-x86_64 mode!!") | |||
| message(STATUS "disable MGE_ENABLE_RTTI when Release/NON-x86_64/NON-MGE_WITH_MIDOUT_PROFILE mode!!") | |||
| endif() | |||
| if(MSVC OR WIN32) | |||
| @@ -83,9 +83,11 @@ LTensorLayout lite::to_impl_layout(const Layout& layout) { | |||
| case LiteDataType::LITE_FLOAT: | |||
| mge_layout.dtype = mgb::dtype::Float32(); | |||
| break; | |||
| #if !MEGDNN_DISABLE_FLOAT16 | |||
| case LiteDataType::LITE_HALF: | |||
| mge_layout.dtype = mgb::dtype::Float16(); | |||
| break; | |||
| #endif | |||
| case LiteDataType::LITE_INT: | |||
| mge_layout.dtype = mgb::dtype::Int32(); | |||
| break; | |||
| @@ -120,9 +122,11 @@ Layout lite::to_lite_layout(const LTensorLayout& mge_layout) { | |||
| case mgb::DTypeEnum::Float32: | |||
| layout.data_type = LiteDataType::LITE_FLOAT; | |||
| break; | |||
| #if !MEGDNN_DISABLE_FLOAT16 | |||
| case mgb::DTypeEnum::Float16: | |||
| layout.data_type = LiteDataType::LITE_HALF; | |||
| break; | |||
| #endif | |||
| case mgb::DTypeEnum::Int32: | |||
| layout.data_type = LiteDataType::LITE_INT; | |||
| break; | |||
| @@ -0,0 +1,14 @@ | |||
| /** | |||
| * \file src/bin_reduce_cmake.h | |||
| * MegEngine is Licensed under the Apache License, Version 2.0 (the "License") | |||
| * | |||
| * Copyright (c) 2014-2021 Megvii Inc. All rights reserved. | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, | |||
| * software distributed under the License is distributed on an | |||
| * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| */ | |||
| /* | |||
| * always empty, override by ../tools/gen_header_for_bin_reduce.py | |||
| */ | |||
| @@ -1,5 +1,5 @@ | |||
| /** | |||
| * \file src/core/include/megbrain_build_config.h | |||
| * \file src/megbrain_build_config.h.in | |||
| * MegEngine is Licensed under the Apache License, Version 2.0 (the "License") | |||
| * | |||
| * Copyright (c) 2014-2021 Megvii Inc. All rights reserved. | |||
| @@ -53,7 +53,16 @@ class HeaderGen: | |||
| cls._megvii3_root_cache = str(wd) | |||
| return cls._megvii3_root_cache | |||
| wd = wd.parent | |||
| raise RuntimeError('This script is supposed to run in megvii3.') | |||
| return None | |||
| _megengine_root_cache = None | |||
| @classmethod | |||
| def get_megengine_root(cls): | |||
| if cls._megengine_root_cache is not None: | |||
| return cls._megengine_root_cache | |||
| wd = Path(__file__).resolve().parent.parent | |||
| cls._megengine_root_cache = str(wd) | |||
| return cls._megengine_root_cache | |||
| def extend_netinfo(self, data): | |||
| self._has_netinfo = True | |||
| @@ -125,11 +134,11 @@ class HeaderGen: | |||
| with tempfile.NamedTemporaryFile() as ftmp: | |||
| fpath = os.path.realpath(ftmp.name) | |||
| subprocess.check_call( | |||
| ['./brain/megbrain/dnn/scripts/gen_param_defs.py', | |||
| ['./dnn/scripts/gen_param_defs.py', | |||
| '--write-enum-items', 'Elemwise:Mode', | |||
| './brain/megbrain/dnn/scripts/opr_param_defs.py', | |||
| './dnn/scripts/opr_param_defs.py', | |||
| fpath], | |||
| cwd=self.get_megvii3_root() | |||
| cwd=self.get_megengine_root() | |||
| ) | |||
| with open(fpath) as fin: | |||
| @@ -178,8 +187,10 @@ class HeaderGen: | |||
| if not self._midout_files: | |||
| return | |||
| gen = os.path.join(self.get_megvii3_root(), 'brain', 'midout', | |||
| 'gen_header.py') | |||
| gen = os.path.join(self.get_megengine_root(), 'third_party', 'midout', 'gen_header.py') | |||
| if self.get_megvii3_root(): | |||
| gen = os.path.join(self.get_megvii3_root(), 'brain', 'midout', 'gen_header.py') | |||
| print('use {} to gen bin_reduce header'.format(gen)) | |||
| cvt = subprocess.run( | |||
| [gen] + self._midout_files, | |||
| stdout=subprocess.PIPE, check=True, | |||
| @@ -212,10 +223,13 @@ def main(): | |||
| ' 1. json files generated by ' | |||
| 'megbrain.serialize_comp_graph_to_file() in python; ' | |||
| ' 2. trace files generated by midout library') | |||
| parser.add_argument('-o', '--output', help='output file', | |||
| default=os.path.join(HeaderGen.get_megvii3_root(), | |||
| 'utils', 'bin_reduce.h')) | |||
| default_file=os.path.join(HeaderGen.get_megengine_root(), 'src', 'bin_reduce_cmake.h') | |||
| is_megvii3 = HeaderGen.get_megvii3_root() | |||
| if is_megvii3: | |||
| default_file=os.path.join(HeaderGen.get_megvii3_root(), 'utils', 'bin_reduce.h') | |||
| parser.add_argument('-o', '--output', help='output file', default=default_file) | |||
| args = parser.parse_args() | |||
| print('config output file: {}'.format(args.output)) | |||
| gen = HeaderGen() | |||
| for i in args.inputs: | |||