#include #include "simdjson.h" #include using namespace simdjson; using namespace benchmark; using namespace std; const padded_string EMPTY_ARRAY("[]", 2); const char *TWITTER_JSON = SIMDJSON_BENCHMARK_DATA_DIR "twitter.json"; const char *NUMBERS_JSON = SIMDJSON_BENCHMARK_DATA_DIR "numbers.json"; static void numbers_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; return; } for (UNUSED auto _ : state) { std::vector container; for (auto e : arr) { double x; e.get().tie(x,error); if(error) { cerr << "found a node that is not an number?" << endl; break;} container.push_back(x); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_scan); static void numbers_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; return; } for (UNUSED auto _ : state) { std::vector container; container.resize(arr.size()); size_t pos = 0; for (auto e : arr) { double x; e.get().tie(x,error); if(error) { cerr << "found a node that is not an number?" << endl; break;} container[pos++] = x; } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_size_scan); static void numbers_type_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; return; } for (UNUSED auto _ : state) { std::vector container; for (auto e : arr) { dom::element_type actual_type = e.type(); if(actual_type != dom::element_type::DOUBLE) { cerr << "found a node that is not an number?" << endl; break; } double x; e.get().tie(x,error); container.push_back(x); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_type_scan); static void numbers_type_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; return; } for (UNUSED auto _ : state) { std::vector container; container.resize(arr.size()); size_t pos = 0; for (auto e : arr) { dom::element_type actual_type = e.type(); if(actual_type != dom::element_type::DOUBLE) { cerr << "found a node that is not an number?" << endl; break; } double x; e.get().tie(x,error); container[pos++] = x; } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_type_size_scan); static void numbers_load_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; for (UNUSED auto _ : state) { // this may hit the disk, but probably just once parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; break; } std::vector container; for (auto e : arr) { double x; e.get().tie(x,error); if(error) { cerr << "found a node that is not an number?" << endl; break;} container.push_back(x); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_load_scan); static void numbers_load_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr; simdjson::error_code error; for (UNUSED auto _ : state) { // this may hit the disk, but probably just once parser.load(NUMBERS_JSON).get().tie(arr, error); if(error) { cerr << "could not read " << NUMBERS_JSON << " as an array" << endl; break; } std::vector container; container.resize(arr.size()); size_t pos = 0; for (auto e : arr) { double x; e.get().tie(x,error); if(error) { cerr << "found a node that is not an number?" << endl; break;} container[pos++] = x; } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_load_size_scan); #if SIMDJSON_EXCEPTIONS static void numbers_exceptions_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr = parser.load(NUMBERS_JSON); for (UNUSED auto _ : state) { std::vector container; for (double x : arr) { container.push_back(x); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_exceptions_scan); static void numbers_exceptions_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr = parser.load(NUMBERS_JSON); for (UNUSED auto _ : state) { std::vector container; container.resize(arr.size()); size_t pos = 0; for (auto e : arr) { container[pos++] = double(e); } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_exceptions_size_scan); static void numbers_type_exceptions_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr = parser.load(NUMBERS_JSON); for (UNUSED auto _ : state) { std::vector container; for (auto e : arr) { dom::element_type actual_type = e.type(); if(actual_type != dom::element_type::DOUBLE) { cerr << "found a node that is not an number?" << endl; break; } container.push_back(double(e)); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_type_exceptions_scan); static void numbers_type_exceptions_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::array arr = parser.load(NUMBERS_JSON); for (UNUSED auto _ : state) { std::vector container; container.resize(arr.size()); size_t pos = 0; for (auto e : arr) { dom::element_type actual_type = e.type(); if(actual_type != dom::element_type::DOUBLE) { cerr << "found a node that is not an number?" << endl; break; } container[pos++] = double(e); } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_type_exceptions_size_scan); static void numbers_exceptions_load_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; for (UNUSED auto _ : state) { // this may hit the disk, but probably just once dom::array arr = parser.load(NUMBERS_JSON); std::vector container; for (double x : arr) { container.push_back(x); } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_exceptions_load_scan); static void numbers_exceptions_load_size_scan(State& state) { // Prints the number of results in twitter.json dom::parser parser; for (UNUSED auto _ : state) { // this may hit the disk, but probably just once dom::array arr = parser.load(NUMBERS_JSON); std::vector container; container.resize(arr.size()); size_t pos = 0; for (double x : arr) { container[pos++] = x; } if(pos != container.size()) { cerr << "bad count" << endl; } benchmark::DoNotOptimize(container.data()); benchmark::ClobberMemory(); } } BENCHMARK(numbers_exceptions_load_size_scan); static void twitter_count(State& state) { // Prints the number of results in twitter.json dom::parser parser; dom::element doc = parser.load(TWITTER_JSON); for (UNUSED auto _ : state) { uint64_t result_count = doc["search_metadata"]["count"]; if (result_count != 100) { return; } } } BENCHMARK(twitter_count); SIMDJSON_PUSH_DISABLE_WARNINGS SIMDJSON_DISABLE_DEPRECATED_WARNING static void iterator_twitter_count(State& state) { // Prints the number of results in twitter.json padded_string json = padded_string::load(TWITTER_JSON); ParsedJson pj = build_parsed_json(json); for (UNUSED auto _ : state) { ParsedJson::Iterator iter(pj); // uint64_t result_count = doc["search_metadata"]["count"]; if (!iter.move_to_key("search_metadata")) { return; } if (!iter.move_to_key("count")) { return; } if (!iter.is_integer()) { return; } int64_t result_count = iter.get_integer(); if (result_count != 100) { return; } } } BENCHMARK(iterator_twitter_count); SIMDJSON_POP_DISABLE_WARNINGS static void twitter_default_profile(State& state) { // Count unique users with a default profile. dom::parser parser; dom::element doc = parser.load(TWITTER_JSON); for (UNUSED auto _ : state) { set default_users; for (dom::object tweet : doc["statuses"].get()) { dom::object user = tweet["user"]; if (user["default_profile"]) { default_users.insert(user["screen_name"]); } } if (default_users.size() != 86) { return; } } } BENCHMARK(twitter_default_profile); static void twitter_image_sizes(State& state) { // Count unique image sizes dom::parser parser; dom::element doc = parser.load(TWITTER_JSON); for (UNUSED auto _ : state) { set> image_sizes; for (dom::object tweet : doc["statuses"].get()) { auto [media, not_found] = tweet["entities"]["media"]; if (!not_found) { for (dom::object image : media.get()) { for (auto size : image["sizes"].get()) { image_sizes.insert({ size.value["w"], size.value["h"] }); } } } } if (image_sizes.size() != 15) { return; }; } } BENCHMARK(twitter_image_sizes); #endif // SIMDJSON_EXCEPTIONS static void error_code_twitter_count(State& state) noexcept { // Prints the number of results in twitter.json dom::parser parser; auto [doc, error1] = parser.load(TWITTER_JSON); if (error1) { return; } for (UNUSED auto _ : state) { auto [value, error] = doc["search_metadata"]["count"].get(); if (error) { return; } if (value != 100) { return; } } } BENCHMARK(error_code_twitter_count); static void error_code_twitter_default_profile(State& state) noexcept { // Count unique users with a default profile. dom::parser parser; auto [doc, error1] = parser.load(TWITTER_JSON); if (error1) { std::cerr << error1 << std::endl; return; } for (UNUSED auto _ : state) { set default_users; auto [tweets, error] = doc["statuses"].get(); if (error) { return; } for (dom::element tweet : tweets) { auto [user, error2] = tweet["user"].get(); if (error2) { return; } auto [default_profile, error3] = user["default_profile"].get(); if (error3) { return; } if (default_profile) { auto [screen_name, error4] = user["screen_name"].get(); if (error4) { return; } default_users.insert(screen_name); } } if (default_users.size() != 86) { return; } } } BENCHMARK(error_code_twitter_default_profile); SIMDJSON_PUSH_DISABLE_WARNINGS SIMDJSON_DISABLE_DEPRECATED_WARNING static void iterator_twitter_default_profile(State& state) { // Count unique users with a default profile. auto [json, error1] = padded_string::load(TWITTER_JSON); if (error1) { std::cerr << error1 << std::endl; return; } ParsedJson pj = build_parsed_json(json); for (UNUSED auto _ : state) { set default_users; ParsedJson::Iterator iter(pj); // for (dom::object tweet : doc["statuses"].get()) { if (!(iter.move_to_key("statuses") && iter.is_array())) { return; } if (iter.down()) { // first status do { // dom::object user = tweet["user"]; if (!(iter.move_to_key("user") && iter.is_object())) { return; } // if (user["default_profile"]) { if (iter.move_to_key("default_profile")) { if (iter.is_true()) { if (!iter.up()) { return; } // back to user // default_users.insert(user["screen_name"]); if (!(iter.move_to_key("screen_name") && iter.is_string())) { return; } default_users.insert(string_view(iter.get_string(), iter.get_string_length())); } if (!iter.up()) { return; } // back to user } if (!iter.up()) { return; } // back to status } while (iter.next()); // next status } if (default_users.size() != 86) { return; } } } SIMDJSON_POP_DISABLE_WARNINGS BENCHMARK(iterator_twitter_default_profile); static void error_code_twitter_image_sizes(State& state) noexcept { // Count unique image sizes dom::parser parser; auto [doc, error1] = parser.load(TWITTER_JSON); if (error1) { std::cerr << error1 << std::endl; return; } for (UNUSED auto _ : state) { set> image_sizes; auto [statuses, error] = doc["statuses"].get(); if (error) { return; } for (dom::element tweet : statuses) { auto [images, not_found] = tweet["entities"]["media"].get(); if (!not_found) { for (dom::element image : images) { auto [sizes, error2] = image["sizes"].get(); if (error2) { return; } for (auto size : sizes) { auto [width, error3] = size.value["w"].get(); auto [height, error4] = size.value["h"].get(); if (error3 || error4) { return; } image_sizes.insert({ width, height }); } } } } if (image_sizes.size() != 15) { return; }; } } BENCHMARK(error_code_twitter_image_sizes); SIMDJSON_PUSH_DISABLE_WARNINGS SIMDJSON_DISABLE_DEPRECATED_WARNING static void iterator_twitter_image_sizes(State& state) { // Count unique image sizes auto [json, error1] = padded_string::load(TWITTER_JSON); if (error1) { std::cerr << error1 << std::endl; return; } ParsedJson pj = build_parsed_json(json); for (UNUSED auto _ : state) { set> image_sizes; ParsedJson::Iterator iter(pj); // for (dom::object tweet : doc["statuses"].get()) { if (!(iter.move_to_key("statuses") && iter.is_array())) { return; } if (iter.down()) { // first status do { // auto [media, not_found] = tweet["entities"]["media"]; // if (!not_found) { if (iter.move_to_key("entities")) { if (!iter.is_object()) { return; } if (iter.move_to_key("media")) { if (!iter.is_array()) { return; } // for (dom::object image : media.get()) { if (iter.down()) { // first media do { // for (auto [key, size] : image["sizes"].get()) { if (!(iter.move_to_key("sizes") && iter.is_object())) { return; } if (iter.down()) { // first size do { iter.move_to_value(); // image_sizes.insert({ size["w"], size["h"] }); if (!(iter.move_to_key("w")) && !iter.is_integer()) { return; } uint64_t width = iter.get_integer(); if (!iter.up()) { return; } // back to size if (!(iter.move_to_key("h")) && !iter.is_integer()) { return; } uint64_t height = iter.get_integer(); if (!iter.up()) { return; } // back to size image_sizes.insert({ width, height }); } while (iter.next()); // next size if (!iter.up()) { return; } // back to sizes } if (!iter.up()) { return; } // back to image } while (iter.next()); // next image if (!iter.up()) { return; } // back to media } if (!iter.up()) { return; } // back to entities } if (!iter.up()) { return; } // back to status } } while (iter.next()); // next status } if (image_sizes.size() != 15) { return; }; } } BENCHMARK(iterator_twitter_image_sizes); static void print_json(State& state) noexcept { // Prints the number of results in twitter.json auto [json, error1] = padded_string::load(TWITTER_JSON); if (error1) { std::cerr << error1 << std::endl; return; } dom::parser parser; if (int error = json_parse(json, parser); error != SUCCESS) { cerr << error_message(error) << endl; return; } for (UNUSED auto _ : state) { std::stringstream s; if (!parser.print_json(s)) { cerr << "print_json failed" << endl; return; } } } BENCHMARK(print_json); SIMDJSON_POP_DISABLE_WARNINGS BENCHMARK_MAIN();