2020-06-25 05:00:19 +08:00
if ( CMAKE_SOURCE_DIR STREQUAL CMAKE_CURRENT_SOURCE_DIR )
2020-10-28 06:43:39 +08:00
message ( STATUS "The simdjson repository appears to be standalone." )
2020-06-25 05:00:19 +08:00
option ( SIMDJSON_JUST_LIBRARY "Build just the library, omit tests, tools and benchmarks" OFF )
message ( STATUS "By default, we attempt to build everything." )
else ( )
message ( STATUS "The simdjson repository appears to be used as a subdirectory." )
option ( SIMDJSON_JUST_LIBRARY "Build just the library, omit tests, tools and benchmarks" ON )
message ( STATUS "By default, we just build the library." )
endif ( )
2020-06-17 22:06:16 +08:00
#
# Flags used by exes and by the simdjson library (project-wide flags)
#
add_library ( simdjson-flags INTERFACE )
add_library ( simdjson-internal-flags INTERFACE )
target_link_libraries ( simdjson-internal-flags INTERFACE simdjson-flags )
2021-03-10 00:39:43 +08:00
option ( SIMDJSON_SANITIZE_UNDEFINED "Sanitize undefined behavior" OFF )
if ( SIMDJSON_SANITIZE_UNDEFINED )
target_compile_options ( simdjson-flags INTERFACE -fsanitize=undefined -fno-sanitize-recover=all )
target_link_libraries ( simdjson-flags INTERFACE -fsanitize=undefined -fno-sanitize-recover=all )
endif ( )
2020-06-17 22:06:16 +08:00
option ( SIMDJSON_SANITIZE "Sanitize addresses" OFF )
if ( SIMDJSON_SANITIZE )
2021-03-10 00:39:43 +08:00
if ( CMAKE_CXX_COMPILER_ID STREQUAL "AppleClang" )
message ( STATUS "The address sanitizer under Apple's clang appears to be incompatible with the undefined-behavior sanitizer." )
message ( STATUS "You may set SIMDJSON_SANITIZE_UNDEFINED to sanitize undefined behavior." )
target_compile_options ( simdjson-flags INTERFACE -fsanitize=address -fno-omit-frame-pointer -fno-sanitize-recover=all )
target_compile_definitions ( simdjson-flags INTERFACE ASAN_OPTIONS=detect_leaks=1 )
target_link_libraries ( simdjson-flags INTERFACE -fsanitize=address -fno-omit-frame-pointer -fno-sanitize-recover=all )
else ( )
message ( STATUS "Setting both the address sanitizer and the undefined sanitizer." )
target_compile_options ( simdjson-flags INTERFACE -fsanitize=address -fno-omit-frame-pointer -fsanitize=undefined -fno-sanitize-recover=all )
target_link_libraries ( simdjson-flags INTERFACE -fsanitize=address -fno-omit-frame-pointer -fsanitize=undefined -fno-sanitize-recover=all )
endif ( )
2020-06-17 22:06:16 +08:00
# Ubuntu bug for GCC 5.0+ (safe for all versions)
if ( CMAKE_COMPILER_IS_GNUCC )
target_link_libraries ( simdjson-flags INTERFACE -fuse-ld=gold )
endif ( )
endif ( )
2021-03-10 00:39:43 +08:00
2020-12-02 01:40:15 +08:00
if ( SIMDJSON_SANITIZE_THREADS )
2021-03-10 00:39:43 +08:00
message ( STATUS "Setting both the thread sanitizer and the undefined-behavior sanitizer." )
2020-12-02 01:40:15 +08:00
target_compile_options ( simdjson-flags INTERFACE -fsanitize=thread -fsanitize=undefined -fno-sanitize-recover=all )
target_link_libraries ( simdjson-flags INTERFACE -fsanitize=thread -fsanitize=undefined -fno-sanitize-recover=all )
# Ubuntu bug for GCC 5.0+ (safe for all versions)
if ( CMAKE_COMPILER_IS_GNUCC )
target_link_libraries ( simdjson-flags INTERFACE -fuse-ld=gold )
endif ( )
endif ( )
2020-06-17 22:06:16 +08:00
2020-04-23 08:25:45 +08:00
if ( NOT CMAKE_BUILD_TYPE )
2021-03-10 00:39:43 +08:00
# Deliberately not including SIMDJSON_SANITIZE_THREADS since thread behavior depends on the build type.
if ( SIMDJSON_SANITIZE OR SIMDJSON_SANITIZE_UNDEFINED )
message ( STATUS "No build type selected and you have enabled the sanitizer, default to Debug. Consider setting CMAKE_BUILD_TYPE." )
set ( CMAKE_BUILD_TYPE Debug CACHE STRING "Choose the type of build." FORCE )
else ( )
message ( STATUS "No build type selected, default to Release" )
set ( CMAKE_BUILD_TYPE Release CACHE STRING "Choose the type of build." FORCE )
2020-06-17 22:06:16 +08:00
endif ( )
2020-04-23 08:25:45 +08:00
endif ( )
if ( MSVC )
option ( SIMDJSON_BUILD_STATIC "Build a static library" ON ) # turning it on disables the production of a dynamic library
else ( )
option ( SIMDJSON_BUILD_STATIC "Build a static library" OFF ) # turning it on disables the production of a dynamic library
option ( SIMDJSON_USE_LIBCPP "Use the libc++ library" OFF )
endif ( )
2021-02-27 05:17:05 +08:00
if ( MSVC AND NOT(SIMDJSON_BUILD_STATIC ) )
# This will require special handling.
set ( SIMDJSON_WINDOWS_DLL TRUE )
endif ( )
2020-04-23 08:25:45 +08:00
set ( CMAKE_MODULE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/tools/cmake" )
# We compile tools, tests, etc. with C++ 17. Override yourself if you need on a target.
set ( CMAKE_CXX_STANDARD 17 )
set ( CMAKE_CXX_STANDARD_REQUIRED ON )
set ( CMAKE_CXX_EXTENSIONS OFF )
set ( CMAKE_MACOSX_RPATH OFF )
set ( CMAKE_THREAD_PREFER_PTHREAD ON )
set ( THREADS_PREFER_PTHREAD_FLAG ON )
# LTO seems to create all sorts of fun problems. Let us
# disable temporarily.
#include(CheckIPOSupported)
#check_ipo_supported(RESULT ltoresult)
#if(ltoresult)
# set(CMAKE_INTERPROCEDURAL_OPTIMIZATION TRUE)
#endif()
2020-07-07 05:53:57 +08:00
option ( SIMDJSON_VISUAL_STUDIO_BUILD_WITH_DEBUG_INFO_FOR_PROFILING "Under Visual Studio, add Zi to the compile flag and DEBUG to the link file to add debugging information to the release build for easier profiling inside tools like VTune" OFF )
2020-04-23 08:25:45 +08:00
if ( MSVC )
2021-02-16 08:49:12 +08:00
if ( "${MSVC_TOOLSET_VERSION}" STRLESS "142" )
set ( SIMDJSON_LEGACY_VISUAL_STUDIO TRUE )
message ( STATUS "A legacy Visual Studio version was detected. We recommend Visual Studio 2019 or better on a 64-bit system." )
endif ( )
2020-12-12 09:28:24 +08:00
if ( "${MSVC_TOOLSET_VERSION}" STREQUAL "140" )
# Visual Studio 2015 issues warnings and we tolerate it, cmake -G"Visual Studio 14" ..
target_compile_options ( simdjson-internal-flags INTERFACE /W0 /sdl )
else ( )
# Recent version of Visual Studio expected (2017, 2019...). Prior versions are unsupported.
target_compile_options ( simdjson-internal-flags INTERFACE /WX /W3 /sdl /w34714 ) # https://docs.microsoft.com/en-us/cpp/error-messages/compiler-warnings/compiler-warning-level-4-c4714?view=vs-2019
endif ( )
if ( SIMDJSON_VISUAL_STUDIO_BUILD_WITH_DEBUG_INFO_FOR_PROFILING )
target_link_options ( simdjson-flags INTERFACE /DEBUG )
target_compile_options ( simdjson-flags INTERFACE /Zi )
endif ( SIMDJSON_VISUAL_STUDIO_BUILD_WITH_DEBUG_INFO_FOR_PROFILING )
else ( MSVC )
2020-11-02 21:18:04 +08:00
if ( NOT WIN32 )
target_compile_options ( simdjson-internal-flags INTERFACE -fPIC )
endif ( )
2020-06-24 04:44:25 +08:00
target_compile_options ( simdjson-internal-flags INTERFACE -Werror -Wall -Wextra -Weffc++ )
target_compile_options ( simdjson-internal-flags INTERFACE -Wsign-compare -Wshadow -Wwrite-strings -Wpointer-arith -Winit-self -Wconversion -Wno-sign-conversion )
2020-12-12 09:28:24 +08:00
endif ( MSVC )
2020-04-23 08:25:45 +08:00
2021-03-02 03:16:30 +08:00
# workaround for GNU GCC poor AVX load/store code generation
if ( ( CMAKE_CXX_COMPILER_ID STREQUAL "GNU" ) AND ( CMAKE_SYSTEM_PROCESSOR MATCHES "^(i.86|x86(_64)?)$" ) )
target_compile_options ( simdjson-flags INTERFACE -mno-avx256-split-unaligned-load -mno-avx256-split-unaligned-store )
endif ( )
2020-09-09 20:46:29 +08:00
#
2020-04-23 08:25:45 +08:00
# Optional flags
2020-09-09 20:46:29 +08:00
#
2020-09-17 02:27:59 +08:00
#
2020-09-09 20:46:29 +08:00
# Implementation selection
2020-09-17 02:27:59 +08:00
#
2020-10-28 06:43:39 +08:00
set ( SIMDJSON_ALL_IMPLEMENTATIONS "fallback;westmere;haswell;arm64;ppc64" )
2020-09-17 02:27:59 +08:00
set ( SIMDJSON_IMPLEMENTATION "" CACHE STRING "Semicolon-separated list of implementations to include (${SIMDJSON_ALL_IMPLEMENTATIONS}). If this is not set, any implementations that are supported at compile time and may be selected at runtime will be included." )
foreach ( implementation ${ SIMDJSON_IMPLEMENTATION } )
if ( NOT ( implementation IN_LIST SIMDJSON_ALL_IMPLEMENTATIONS ) )
message ( ERROR "Implementation ${implementation} not supported by simdjson. Possible implementations: ${SIMDJSON_ALL_IMPLEMENTATIONS}" )
endif ( )
endforeach ( implementation )
2020-10-28 06:43:39 +08:00
set ( SIMDJSON_EXCLUDE_IMPLEMENTATION "" CACHE STRING "Semicolon-separated list of implementations to exclude (haswell/westmere/arm64/ppc64/fallback). By default, excludes any implementations that are unsupported at compile time or cannot be selected at runtime." )
2020-09-17 02:27:59 +08:00
foreach ( implementation ${ SIMDJSON_EXCLUDE_IMPLEMENTATION } )
if ( NOT ( implementation IN_LIST SIMDJSON_ALL_IMPLEMENTATIONS ) )
message ( ERROR "Implementation ${implementation} not supported by simdjson. Possible implementations: ${SIMDJSON_ALL_IMPLEMENTATIONS}" )
endif ( )
endforeach ( implementation )
foreach ( implementation ${ SIMDJSON_ALL_IMPLEMENTATIONS } )
string ( TOUPPER ${ implementation } implementation_upper )
if ( implementation IN_LIST SIMDJSON_EXCLUDE_IMPLEMENTATION )
message ( STATUS "Excluding implementation ${implementation} due to SIMDJSON_EXCLUDE_IMPLEMENTATION=${SIMDJSON_EXCLUDE_IMPLEMENTATION}" )
target_compile_definitions ( simdjson-flags INTERFACE "SIMDJSON_IMPLEMENTATION_${implementation_upper}=0" )
elseif ( implementation IN_LIST SIMDJSON_IMPLEMENTATION )
message ( STATUS "Including implementation ${implementation} due to SIMDJSON_IMPLEMENTATION=${SIMDJSON_IMPLEMENTATION}" )
target_compile_definitions ( simdjson-flags INTERFACE "SIMDJSON_IMPLEMENTATION_${implementation_upper}=1" )
elseif ( SIMDJSON_IMPLEMENTATION )
message ( STATUS "Excluding implementation ${implementation} due to SIMDJSON_IMPLEMENTATION=${SIMDJSON_IMPLEMENTATION}" )
target_compile_definitions ( simdjson-flags INTERFACE "SIMDJSON_IMPLEMENTATION_${implementation_upper}=0" )
endif ( )
endforeach ( implementation )
# TODO make it so this generates the necessary compiler flags to select the given implementation as the builtin automatically!
option ( SIMDJSON_BUILTIN_IMPLEMENTATION "Select the implementation that will be used for user code. Defaults to the most universal implementation in SIMDJSON_IMPLEMENTATION (in the order ${SIMDJSON_ALL_IMPLEMENTATIONS}) if specified; otherwise, by default the compiler will pick the best implementation that can always be selected given the compiler flags." "" )
if ( SIMDJSON_BUILTIN_IMPLEMENTATION )
target_compile_definitions ( simdjson-flags INTERFACE "SIMDJSON_BUILTIN_IMPLEMENTATION=${SIMDJSON_BUILTIN_IMPLEMENTATION}" )
else ( )
# Pick the most universal implementation out of the selected implementations (if any)
foreach ( implementation ${ SIMDJSON_ALL_IMPLEMENTATIONS } )
if ( implementation IN_LIST SIMDJSON_IMPLEMENTATION AND NOT ( implementation IN_LIST SIMDJSON_EXCLUDE_IMPLEMENTATION ) )
message ( STATUS "Selected implementation ${implementation} as builtin implementation based on ${SIMDJSON_IMPLEMENTATION}." )
target_compile_definitions ( simdjson-flags INTERFACE "SIMDJSON_BUILTIN_IMPLEMENTATION=${implementation}" )
break ( )
endif ( )
endforeach ( implementation )
endif ( SIMDJSON_BUILTIN_IMPLEMENTATION )
2020-04-23 08:25:45 +08:00
option ( SIMDJSON_IMPLEMENTATION_HASWELL "Include the haswell implementation" ON )
if ( NOT SIMDJSON_IMPLEMENTATION_HASWELL )
2020-09-17 02:27:59 +08:00
message ( DEPRECATION "SIMDJSON_IMPLEMENTATION_HASWELL is deprecated. Use SIMDJSON_IMPLEMENTATION=-haswell instead." )
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_IMPLEMENTATION_HASWELL=0 )
2020-04-23 08:25:45 +08:00
endif ( )
option ( SIMDJSON_IMPLEMENTATION_WESTMERE "Include the westmere implementation" ON )
if ( NOT SIMDJSON_IMPLEMENTATION_WESTMERE )
2020-09-09 20:46:29 +08:00
message ( DEPRECATION "SIMDJSON_IMPLEMENTATION_WESTMERE is deprecated. SIMDJSON_IMPLEMENTATION=-westmere instead." )
2020-09-17 02:27:59 +08:00
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_IMPLEMENTATION_WESTMERE=0 )
2020-04-23 08:25:45 +08:00
endif ( )
option ( SIMDJSON_IMPLEMENTATION_ARM64 "Include the arm64 implementation" ON )
if ( NOT SIMDJSON_IMPLEMENTATION_ARM64 )
2020-09-09 20:46:29 +08:00
message ( DEPRECATION "SIMDJSON_IMPLEMENTATION_ARM64 is deprecated. Use SIMDJSON_IMPLEMENTATION=-arm64 instead." )
2020-09-17 02:27:59 +08:00
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_IMPLEMENTATION_ARM64=0 )
2020-04-23 08:25:45 +08:00
endif ( )
2020-10-28 06:43:39 +08:00
option ( SIMDJSON_IMPLEMENTATION_PPC64 "Include the arm64 implementation" ON )
if ( NOT SIMDJSON_IMPLEMENTATION_PPC64 )
message ( DEPRECATION "SIMDJSON_IMPLEMENTATION_PPC64 is deprecated. Use SIMDJSON_IMPLEMENTATION=-ppc64 instead." )
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_IMPLEMENTATION_PPC64=0 )
endif ( )
2020-04-23 08:25:45 +08:00
option ( SIMDJSON_IMPLEMENTATION_FALLBACK "Include the fallback implementation" ON )
if ( NOT SIMDJSON_IMPLEMENTATION_FALLBACK )
2020-09-09 20:46:29 +08:00
message ( DEPRECATION "SIMDJSON_IMPLEMENTATION_FALLBACK is deprecated. Use SIMDJSON_IMPLEMENTATION=-fallback instead." )
2020-09-17 02:27:59 +08:00
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_IMPLEMENTATION_FALLBACK=0 )
2020-04-23 08:25:45 +08:00
endif ( )
2020-09-09 20:46:29 +08:00
2020-09-17 02:27:59 +08:00
#
# Other optional flags
#
2021-02-21 03:46:01 +08:00
option ( SIMDJSON_DEVELOPMENT_CHECKS "Enable development-time aids, such as checks for incorrect API usage. Enabled by default in DEBUG." OFF )
if ( SIMDJSON_DEVELOPMENT_CHECKS )
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_DEVELOPMENT_CHECKS )
2021-02-06 05:34:52 +08:00
endif ( )
2020-04-23 08:25:45 +08:00
2020-08-17 23:50:57 +08:00
option ( SIMDJSON_BASH "Allow usage of bash within CMake" ON )
2020-04-23 08:25:45 +08:00
option ( SIMDJSON_EXCEPTIONS "Enable simdjson's exception-throwing interface" ON )
if ( NOT SIMDJSON_EXCEPTIONS )
message ( STATUS "simdjson exception interface turned off. Code that does not check error codes will not compile." )
2020-09-17 02:27:59 +08:00
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_EXCEPTIONS=0 )
2020-10-27 02:11:25 +08:00
if ( MSVC )
# CMake currently /EHsc as a default flag in CMAKE_CXX_FLAGS on MSVC. Replacing this with a more general abstraction is a WIP (see https://gitlab.kitware.com/cmake/cmake/-/issues/20610)
# /EHs enables standard C++ stack unwinding when catching exceptions (non-structured exception handling)
# /EHc used in conjection with /EHs indicates that extern "C" functions never throw (terminate-on-throw)
# Here, we disable both with the - argument negation operator
string ( REPLACE "/EHsc" "/EHs-c-" CMAKE_CXX_FLAGS ${ CMAKE_CXX_FLAGS } )
# Because we cannot change the flag above on an invidual target (yet), the definition below must similarly be added globally
add_definitions ( -D_HAS_EXCEPTIONS=0 )
2021-02-27 05:15:34 +08:00
elseif ( CMAKE_COMPILER_IS_GNUCC )
target_link_libraries ( simdjson-flags INTERFACE -fno-exceptions )
2020-10-27 02:11:25 +08:00
endif ( )
2020-04-23 08:25:45 +08:00
endif ( )
2020-06-27 01:23:44 +08:00
option ( SIMDJSON_ENABLE_THREADS "Link with thread support" ON )
2020-04-23 08:25:45 +08:00
if ( SIMDJSON_ENABLE_THREADS )
2020-04-30 04:47:36 +08:00
set ( CMAKE_THREAD_PREFER_PTHREAD TRUE )
set ( THREADS_PREFER_PTHREAD_FLAG TRUE )
2020-06-06 09:01:41 +08:00
find_package ( Threads REQUIRED )
Using a worker instead of a thread per batch (#920)
In the parse_many function, we have one thread doing the stage 1, while the main thread does stage 2. So if stage 1 and stage 2 take half the time, the parse_many could run at twice the speed. It is unlikely to do so. Still, we see benefits of about 40% due to threading.
To achieve this interleaving, we load the data in batches (blocks) of some size. In the current code (master), we create a new thread for each batch. Thread creation is expensive so our approach only works over sizeable batches. This PR improves things and makes parse_many faster when using small batches.
This fixes our parse_stream benchmark which is just busted.
This replaces the one-thread per batch routine by a worker object that reuses the same thread. In benchmarks, this allows us to get the same maximal speed, but with smaller processing blocks. It does not help much with larger blocks because the cost of the thread create gets amortized efficiently.
This PR makes parse_many beneficial over small datasets. It also makes us less dependent on the thread creation time.
Unfortunately, it is going to be difficult to say anything definitive in general. The cost of creating a thread varies widely depending on the OS. On some systems, it might be cheap, in others very expensive. It should be expected that the new code will depend less drastically on the performances of the underlying system, since we create juste one thread.
Co-authored-by: John Keiser <john@johnkeiser.com>
Co-authored-by: Daniel Lemire <lemire@gmai.com>
2020-06-13 04:51:18 +08:00
target_link_libraries ( simdjson-flags INTERFACE Threads::Threads )
2020-06-27 01:23:44 +08:00
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_THREADS_ENABLED=1 ) # This will be set in the code automatically.
endif ( )
2020-08-14 04:36:20 +08:00
option ( SIMDJSON_VERBOSE_LOGGING, "Enable verbose logging for internal simdjson library development." OFF )
if ( SIMDJSON_VERBOSE_LOGGING )
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_VERBOSE_LOGGING=1 )
endif ( )
2020-11-01 13:38:52 +08:00
option ( SIMDJSON_DISABLE_DEPRECATED_API "Disables deprecated APIs" Off )
if ( SIMDJSON_DISABLE_DEPRECATED_API )
target_compile_definitions ( simdjson-flags INTERFACE SIMDJSON_DISABLE_DEPRECATED_API=1 )
endif ( )
2020-04-23 08:25:45 +08:00
if ( SIMDJSON_USE_LIBCPP )
target_link_libraries ( simdjson-flags INTERFACE -stdlib=libc++ -lc++abi )
# instead of the above line, we could have used
# set(CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -stdlib=libc++ -lc++abi")
# The next line is needed empirically.
set ( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -stdlib=libc++" )
# we update CMAKE_SHARED_LINKER_FLAGS, this gets updated later as well
set ( CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -lc++abi" )
endif ( SIMDJSON_USE_LIBCPP )
# prevent shared libraries from depending on Intel provided libraries
if ( ${ CMAKE_C_COMPILER_ID } MATCHES "Intel" ) # icc / icpc
set ( CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -static-intel" )
endif ( )
2020-12-12 09:28:24 +08:00
include ( CheckSymbolExists )
CHECK_SYMBOL_EXISTS ( fork unistd.h HAVE_POSIX_FORK )
CHECK_SYMBOL_EXISTS ( wait sys/wait.h HAVE_POSIX_WAIT )
2020-04-30 07:06:19 +08:00
install ( TARGETS simdjson-flags EXPORT simdjson-config )
2021-01-21 02:20:49 +08:00
# I do not think we want to export our internal flags!
# install(TARGETS simdjson-internal-flags EXPORT simdjson-config)