#!/bin/bash
########################################################################
# Generates an "amalgamation build" for simdjson. Inspired by a similar
# script used by whefs.
########################################################################

# Physical (symlink-resolved) directory containing this script; all input
# paths below are anchored here. '&&' (rather than ';') keeps a failed cd
# from silently yielding the caller's working directory instead.
SCRIPTPATH="$(cd "$(dirname "$0")" && pwd -P)"

echo "We are about to amalgamate all simdjson files into one source file. "
echo "See https://www.sqlite.org/amalgamation.html and https://en.wikipedia.org/wiki/Single_Compilation_Unit for rationale. "

# Names of the generated amalgamated header and source file. They are
# created relative to the current working directory.
AMAL_H="simdjson.h"
AMAL_C="simdjson.cpp"

# Implementation files (private headers and .cpp files) that are pasted into
# the amalgamated source file.
# order does not matter
# NOTE: this is a whitespace-separated list that is expanded unquoted by its
# consumers, so it must contain nothing but paths (and the paths must not
# contain whitespace).
ALLCFILES="
$SCRIPTPATH/src/jsoncharutils.h
$SCRIPTPATH/src/numberparsing.h
$SCRIPTPATH/src/simdprune_tables.h
$SCRIPTPATH/src/simdjson.cpp
$SCRIPTPATH/src/jsonioutil.cpp
$SCRIPTPATH/src/jsonminifier.cpp
$SCRIPTPATH/src/jsonparser.cpp
$SCRIPTPATH/src/jsonstream.cpp
$SCRIPTPATH/src/arm64/bitmask.h
$SCRIPTPATH/src/haswell/bitmask.h
$SCRIPTPATH/src/westmere/bitmask.h
$SCRIPTPATH/src/arm64/simd.h
$SCRIPTPATH/src/haswell/simd.h
$SCRIPTPATH/src/westmere/simd.h
$SCRIPTPATH/src/arm64/stage1_find_marks.h
$SCRIPTPATH/src/haswell/stage1_find_marks.h
$SCRIPTPATH/src/westmere/stage1_find_marks.h
$SCRIPTPATH/src/stage1_find_marks.cpp
$SCRIPTPATH/src/arm64/stringparsing.h
$SCRIPTPATH/src/haswell/stringparsing.h
$SCRIPTPATH/src/westmere/stringparsing.h
$SCRIPTPATH/src/stage2_build_tape.cpp
$SCRIPTPATH/src/arm64/stage2_build_tape.h
$SCRIPTPATH/src/haswell/stage2_build_tape.h
$SCRIPTPATH/src/westmere/stage2_build_tape.h
$SCRIPTPATH/src/parsedjson.cpp
$SCRIPTPATH/src/parsedjsoniterator.cpp
"

# Public headers that are concatenated, in exactly this order, into the
# amalgamated header.
# order matters
# NOTE: this is a whitespace-separated list that is expanded unquoted by its
# consumers, so it must contain nothing but paths (and the paths must not
# contain whitespace).
ALLCHEADERS="
$SCRIPTPATH/include/simdjson/simdjson_version.h
$SCRIPTPATH/include/simdjson/portability.h
$SCRIPTPATH/include/simdjson/isadetection.h
$SCRIPTPATH/include/simdjson/jsonformatutils.h
$SCRIPTPATH/include/simdjson/simdjson.h
$SCRIPTPATH/include/simdjson/common_defs.h
$SCRIPTPATH/include/simdjson/padded_string.h
$SCRIPTPATH/include/simdjson/jsonioutil.h
$SCRIPTPATH/include/simdjson/jsonminifier.h
$SCRIPTPATH/include/simdjson/parsedjson.h
$SCRIPTPATH/include/simdjson/parsedjsoniterator.h
$SCRIPTPATH/include/simdjson/stage1_find_marks.h
$SCRIPTPATH/include/simdjson/stage2_build_tape.h
$SCRIPTPATH/include/simdjson/jsonparser.h
$SCRIPTPATH/include/simdjson/jsonstream.h
"

# Fail fast, before any output file is touched, if a listed input is missing.
# The two lists are intentionally expanded unquoted: they are
# whitespace-separated strings, one path per word.
for i in ${ALLCHEADERS} ${ALLCFILES}; do
  if [[ ! -e "$i" ]]; then
    # Diagnostics go to stderr so they are not lost in redirected output.
    echo "FATAL: source file [$i] not found." >&2
    exit 127
  fi
done

#######################################
# Writes one source file to stdout for inclusion in an amalgamated file,
# wrapped in "begin file"/"end file" marker comments.
#
# Lines of the form  #include "..."  are resolved against the project tree
# (a leading "../" component is dropped first):
#   - found under include/          -> the line is dropped
#   - found under src/ and matching *generic/*.h
#                                   -> replaced by that file's contents
#   - found under src/ otherwise    -> the line is dropped
#   - not found                     -> the line is copied unchanged
# Every other line is copied verbatim.
#
# Globals:   SCRIPTPATH (read) - project root; include/ and src/ live here
# Arguments: $1 - path of the file to emit
# Outputs:   the processed file on stdout
#######################################
function dofile()
{
  local src_path=$1
  local rel_path=${src_path#"$SCRIPTPATH/"}
  local line inc

  echo "/* begin file $rel_path */"
  # echo "#line 8 \"$1\"" ## redefining the line/file is not nearly as useful as it sounds for debugging. It breaks IDEs.

  # '|| [[ -n "$line" ]]' keeps a final line that lacks a trailing newline;
  # a plain 'read' loop would silently drop it.
  while IFS= read -r line || [[ -n "$line" ]]; do
    if [[ "$line" == '#include "'*'"'* ]]; then
      # Text between the first pair of double quotes. Parameter expansion is
      # used so the name is never word-split or glob-expanded.
      inc=${line#*\"}
      inc=${inc%%\"*}

      if [[ "$inc" == '../'* ]]; then
        inc=${inc#*/}
      fi

      # we ignore simdjson headers (except src/generic/*.h); they are handled
      # by the explicit file lists. Lookups are anchored at SCRIPTPATH so the
      # result does not depend on the caller's working directory.
      if [[ -f "$SCRIPTPATH/include/$inc" ]]; then
        continue
      elif [[ -f "$SCRIPTPATH/src/$inc" ]]; then
        # we paste the contents of src/generic/*.h
        if [[ "$inc" == *'generic/'*'.h' ]]; then
          printf '%s\n' "$(<"$SCRIPTPATH/src/$inc")"
        fi
        continue
      fi
    fi

    # Otherwise we simply copy the line
    printf '%s\n' "$line"
  done < "$src_path"

  echo "/* end file $rel_path */"
}

# Captured once so every generated file carries the same timestamp.
timestamp=$(date)

# Build the amalgamated header: a banner followed by every public header,
# in list order. A single truncating redirect covers the whole group.
echo "Creating ${AMAL_H}..."
{
  echo "/* auto-generated on ${timestamp}. Do not edit! */"
  # ALLCHEADERS is a whitespace-separated string; unquoted on purpose.
  for h in ${ALLCHEADERS}; do
    dofile "$h"
  done
} > "${AMAL_H}"

# Build the amalgamated source file: a banner, an include of the amalgamated
# header, the optional dmalloc hook, then every implementation file.
echo "Creating ${AMAL_C}..."
{
  echo "/* auto-generated on ${timestamp}. Do not edit! */"
  echo "#include \"${AMAL_H}\""

  echo ""
  echo "/* used for http://dmalloc.com/ Dmalloc - Debug Malloc Library */"
  echo "#ifdef DMALLOC"
  echo "#include \"dmalloc.h\""
  echo "#endif"
  echo ""

  # ALLCFILES is a whitespace-separated string; unquoted on purpose.
  for h in ${ALLCFILES}; do
    dofile "$h"
  done
} > "${AMAL_C}"

# Write a small demo program that includes the amalgamated files directly and
# parses two files given on its command line (one via build_parsed_json, one
# via JsonStream).
DEMOCPP="amalgamation_demo.cpp"
echo "Creating ${DEMOCPP}..."
{
  echo "/* auto-generated on ${timestamp}. Do not edit! */"
  # Quoted delimiter: the C++ text below is emitted literally, no expansion.
  cat <<'EOF'

#include <cstdlib>
#include <iostream>
#include "simdjson.h"
#include "simdjson.cpp"
int main(int argc, char *argv[]) {
  if(argc < 3) {
    std::cerr << "Please specify filenames " << std::endl;
    return EXIT_FAILURE;
  }
  const char * filename = argv[1];
  simdjson::padded_string p = simdjson::get_corpus(filename);
  simdjson::ParsedJson pj = simdjson::build_parsed_json(p); // do the parsing
  if( ! pj.is_valid() ) {
    std::cout << "build_parsed_json not valid" << std::endl;
  } else {
    std::cout << "build_parsed_json valid" << std::endl;
  }

  //JsonStream
  const char * filename2 = argv[2];
  simdjson::padded_string p2 = simdjson::get_corpus(filename2);
  simdjson::ParsedJson pj2;
  simdjson::JsonStream js{p2.data(), p2.size()};
  int parse_res = simdjson::SUCCESS_AND_HAS_MORE;

  while (parse_res == simdjson::SUCCESS_AND_HAS_MORE) {
    parse_res = js.json_parse(pj2);
  }

  if( ! pj2.is_valid()) {
    std::cout << "JsonStream not valid" << std::endl;
  } else {
    std::cout << "JsonStream valid" << std::endl;
  }

  return EXIT_SUCCESS;
}

EOF
} > "${DEMOCPP}"

# Report what was generated, publish the files into singleheader/ next to
# this script, then build and run the demo from there as a smoke test.
echo "Done with all files generation. "

echo "Files have been written to directory: $PWD "
ls -la "${AMAL_C}" "${AMAL_H}" "${DEMOCPP}"

echo "Giving final instructions:"

# Demo binary name: the demo source name with everything from the first '.'
# removed.
CPPBIN=${DEMOCPP%%.*}

# The build-and-run command, shown to the user and stored in the README.
# The JSON paths are relative to the singleheader directory.
demo_cmd="c++ -O3 -std=c++17 -o ${CPPBIN} ${DEMOCPP} && ./${CPPBIN} ../jsonexamples/twitter.json ../jsonexamples/amazon_cellphones.ndjson"

echo "Try :"
echo "${demo_cmd}"

SINGLEHDR=$SCRIPTPATH/singleheader
echo "Copying files to $SCRIPTPATH/singleheader "
mkdir -p "$SINGLEHDR"
echo "${demo_cmd}" > "$SINGLEHDR/README.md"
cp "${AMAL_C}" "${AMAL_H}" "${DEMOCPP}" "$SINGLEHDR"
ls "$SINGLEHDR"

# NOTE: this cd is not undone; anything that runs after this line executes
# with $SINGLEHDR as its working directory.
cd "$SINGLEHDR" && c++ -O3 -std=c++17 -o "${CPPBIN}" "${DEMOCPP}" && "./${CPPBIN}" ../jsonexamples/twitter.json ../jsonexamples/amazon_cellphones.ndjson

#######################################
# Prints its argument converted to lower case.
# Arguments: $1 - string to convert
# Outputs:   the lower-cased string, followed by a newline, on stdout
#######################################
lowercase(){
  # printf instead of echo so arguments such as "-n" or "-e" are treated as
  # data; POSIX character classes instead of 'A-Z'/'a-z' ranges, whose
  # meaning depends on the locale's collation order.
  printf '%s\n' "$1" | tr '[:upper:]' '[:lower:]'
}

# Lower-cased kernel name as reported by uname. $(...) nests without the
# backslash-escaped backticks, and the inner result is quoted so it is passed
# to lowercase as a single argument.
OS=$(lowercase "$(uname)")