conflicts are solved
This commit is contained in:
parent
78406ba954
commit
9230588ce8
|
@ -19,5 +19,6 @@ Reini Urban
|
||||||
Tom Dyson
|
Tom Dyson
|
||||||
Ihor Dotsenko
|
Ihor Dotsenko
|
||||||
Alexey Milovidov
|
Alexey Milovidov
|
||||||
|
Chang Liu
|
||||||
# if you have contributed to the project and your name does not
|
# if you have contributed to the project and your name does not
|
||||||
# appear in this list, please let us know!
|
# appear in this list, please let us know!
|
||||||
|
|
|
@ -30,7 +30,7 @@ void print_vec(const std::vector<int64_t> &v) {
|
||||||
std::cout << std::endl;
|
std::cout << std::endl;
|
||||||
}
|
}
|
||||||
|
|
||||||
void simdjson_scan(std::vector<int64_t> &answer, ParsedJson::iterator &i) {
|
void simdjson_scan(std::vector<int64_t> &answer, simdjson::ParsedJson::iterator &i) {
|
||||||
while(i.move_forward()) {
|
while(i.move_forward()) {
|
||||||
if(i.get_scope_type() == '{') {
|
if(i.get_scope_type() == '{') {
|
||||||
bool founduser = (i.get_string_length() == 4) && (memcmp(i.get_string(), "user", 4) == 0);
|
bool founduser = (i.get_string_length() == 4) && (memcmp(i.get_string(), "user", 4) == 0);
|
||||||
|
@ -48,30 +48,30 @@ void simdjson_scan(std::vector<int64_t> &answer, ParsedJson::iterator &i) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
std::vector<int64_t> simdjson_justdom(ParsedJson &pj) {
|
std::vector<int64_t> simdjson_justdom(simdjson::ParsedJson &pj) {
|
||||||
std::vector<int64_t> answer;
|
std::vector<int64_t> answer;
|
||||||
ParsedJson::iterator i(pj);
|
simdjson::ParsedJson::iterator i(pj);
|
||||||
simdjson_scan(answer,i);
|
simdjson_scan(answer,i);
|
||||||
remove_duplicates(answer);
|
remove_duplicates(answer);
|
||||||
return answer;
|
return answer;
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
std::vector<int64_t> simdjson_computestats(const padded_string &p) {
|
std::vector<int64_t> simdjson_computestats(const simdjson::padded_string &p) {
|
||||||
std::vector<int64_t> answer;
|
std::vector<int64_t> answer;
|
||||||
ParsedJson pj = build_parsed_json(p);
|
simdjson::ParsedJson pj = simdjson::build_parsed_json(p);
|
||||||
if (!pj.isValid()) {
|
if (!pj.isValid()) {
|
||||||
return answer;
|
return answer;
|
||||||
}
|
}
|
||||||
ParsedJson::iterator i(pj);
|
simdjson::ParsedJson::iterator i(pj);
|
||||||
simdjson_scan(answer,i);
|
simdjson_scan(answer,i);
|
||||||
remove_duplicates(answer);
|
remove_duplicates(answer);
|
||||||
return answer;
|
return answer;
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
bool simdjson_justparse(const padded_string &p) {
|
bool simdjson_justparse(const simdjson::padded_string &p) {
|
||||||
ParsedJson pj = build_parsed_json(p);
|
simdjson::ParsedJson pj = simdjson::build_parsed_json(p);
|
||||||
bool answer = !pj.isValid();
|
bool answer = !pj.isValid();
|
||||||
return answer;
|
return answer;
|
||||||
}
|
}
|
||||||
|
@ -135,7 +135,7 @@ std::vector<int64_t> sasjon_justdom(sajson::document & d) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
std::vector<int64_t> sasjon_computestats(const padded_string &p) {
|
std::vector<int64_t> sasjon_computestats(const simdjson::padded_string &p) {
|
||||||
std::vector<int64_t> answer;
|
std::vector<int64_t> answer;
|
||||||
char *buffer = (char *)malloc(p.size());
|
char *buffer = (char *)malloc(p.size());
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
|
@ -152,7 +152,7 @@ std::vector<int64_t> sasjon_computestats(const padded_string &p) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
bool sasjon_justparse(const padded_string &p) {
|
bool sasjon_justparse(const simdjson::padded_string &p) {
|
||||||
char *buffer = (char *)malloc(p.size());
|
char *buffer = (char *)malloc(p.size());
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
auto d = sajson::parse(sajson::dynamic_allocation(),
|
auto d = sajson::parse(sajson::dynamic_allocation(),
|
||||||
|
@ -210,7 +210,7 @@ std::vector<int64_t> rapid_justdom(rapidjson::Document &d) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
std::vector<int64_t> rapid_computestats(const padded_string &p) {
|
std::vector<int64_t> rapid_computestats(const simdjson::padded_string &p) {
|
||||||
std::vector<int64_t> answer;
|
std::vector<int64_t> answer;
|
||||||
char *buffer = (char *)malloc(p.size() + 1);
|
char *buffer = (char *)malloc(p.size() + 1);
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
|
@ -228,7 +228,7 @@ std::vector<int64_t> rapid_computestats(const padded_string &p) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
bool rapid_justparse(const padded_string &p) {
|
bool rapid_justparse(const simdjson::padded_string &p) {
|
||||||
char *buffer = (char *)malloc(p.size() + 1);
|
char *buffer = (char *)malloc(p.size() + 1);
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
buffer[p.size()] = '\0';
|
buffer[p.size()] = '\0';
|
||||||
|
@ -267,9 +267,9 @@ int main(int argc, char *argv[]) {
|
||||||
if (optind + 1 < argc) {
|
if (optind + 1 < argc) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
@ -321,7 +321,7 @@ int main(int argc, char *argv[]) {
|
||||||
!justdata);
|
!justdata);
|
||||||
BEST_TIME("sasjon (just parse) ", sasjon_justparse(p), false, , repeat, volume,
|
BEST_TIME("sasjon (just parse) ", sasjon_justparse(p), false, , repeat, volume,
|
||||||
!justdata);
|
!justdata);
|
||||||
ParsedJson dsimdjson = build_parsed_json(p);
|
simdjson::ParsedJson dsimdjson = simdjson::build_parsed_json(p);
|
||||||
BEST_TIME("simdjson (just dom) ", simdjson_justdom(dsimdjson).size(), size, , repeat,
|
BEST_TIME("simdjson (just dom) ", simdjson_justdom(dsimdjson).size(), size, , repeat,
|
||||||
volume, !justdata);
|
volume, !justdata);
|
||||||
char *buffer = (char *)malloc(p.size());
|
char *buffer = (char *)malloc(p.size());
|
||||||
|
|
|
@ -65,9 +65,9 @@ int main(int argc, char *argv[]) {
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
const char * filename = argv[optind];
|
const char * filename = argv[optind];
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception& e) { // caught by reference to base
|
} catch (const std::exception& e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
|
|
@ -78,9 +78,9 @@ int main(int argc, char *argv[]) {
|
||||||
if (verbose) {
|
if (verbose) {
|
||||||
std::cout << "[verbose] loading " << filename << std::endl;
|
std::cout << "[verbose] loading " << filename << std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
@ -128,7 +128,7 @@ int main(int argc, char *argv[]) {
|
||||||
std::cout << "[verbose] iteration # " << i << std::endl;
|
std::cout << "[verbose] iteration # " << i << std::endl;
|
||||||
}
|
}
|
||||||
unified.start();
|
unified.start();
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size());
|
bool allocok = pj.allocateCapacity(p.size());
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "failed to allocate memory" << std::endl;
|
std::cerr << "failed to allocate memory" << std::endl;
|
||||||
|
@ -145,7 +145,7 @@ int main(int argc, char *argv[]) {
|
||||||
}
|
}
|
||||||
unified.start();
|
unified.start();
|
||||||
// The default template is simdjson::instruction_set::native.
|
// The default template is simdjson::instruction_set::native.
|
||||||
isok = (find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
isok = (simdjson::find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
||||||
unified.end(results);
|
unified.end(results);
|
||||||
cy1 += results[0];
|
cy1 += results[0];
|
||||||
cl1 += results[1];
|
cl1 += results[1];
|
||||||
|
@ -175,7 +175,7 @@ int main(int argc, char *argv[]) {
|
||||||
if (verbose) {
|
if (verbose) {
|
||||||
std::cout << "[verbose] iteration # " << i << std::endl;
|
std::cout << "[verbose] iteration # " << i << std::endl;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size());
|
bool allocok = pj.allocateCapacity(p.size());
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "failed to allocate memory" << std::endl;
|
std::cerr << "failed to allocate memory" << std::endl;
|
||||||
|
@ -187,7 +187,7 @@ int main(int argc, char *argv[]) {
|
||||||
|
|
||||||
auto start = std::chrono::steady_clock::now();
|
auto start = std::chrono::steady_clock::now();
|
||||||
// The default template is simdjson::instruction_set::native.
|
// The default template is simdjson::instruction_set::native.
|
||||||
isok = (find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
isok = (simdjson::find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
||||||
isok = isok && (simdjson::SUCCESS == unified_machine(p.data(), p.size(), pj));
|
isok = isok && (simdjson::SUCCESS == unified_machine(p.data(), p.size(), pj));
|
||||||
auto end = std::chrono::steady_clock::now();
|
auto end = std::chrono::steady_clock::now();
|
||||||
std::chrono::duration<double> secs = end - start;
|
std::chrono::duration<double> secs = end - start;
|
||||||
|
@ -198,7 +198,7 @@ int main(int argc, char *argv[]) {
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
ParsedJson pj = build_parsed_json(p); // do the parsing again to get the stats
|
simdjson::ParsedJson pj = build_parsed_json(p); // do the parsing again to get the stats
|
||||||
if (!pj.isValid()) {
|
if (!pj.isValid()) {
|
||||||
std::cerr << pj.getErrorMsg() << std::endl;
|
std::cerr << pj.getErrorMsg() << std::endl;
|
||||||
std::cerr << "Could not parse. " << std::endl;
|
std::cerr << "Could not parse. " << std::endl;
|
||||||
|
|
|
@ -146,7 +146,7 @@ void sajson_traverse(stat_t &stats, const sajson::value &node) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
stat_t sasjon_computestats(const padded_string &p) {
|
stat_t sasjon_computestats(const simdjson::padded_string &p) {
|
||||||
stat_t answer;
|
stat_t answer;
|
||||||
char *buffer = (char *)malloc(p.size());
|
char *buffer = (char *)malloc(p.size());
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
|
@ -204,7 +204,7 @@ void rapid_traverse(stat_t &stats, const rapidjson::Value &v) {
|
||||||
}
|
}
|
||||||
|
|
||||||
__attribute__ ((noinline))
|
__attribute__ ((noinline))
|
||||||
stat_t rapid_computestats(const padded_string &p) {
|
stat_t rapid_computestats(const simdjson::padded_string &p) {
|
||||||
stat_t answer;
|
stat_t answer;
|
||||||
char *buffer = (char *)malloc(p.size() + 1);
|
char *buffer = (char *)malloc(p.size() + 1);
|
||||||
memcpy(buffer, p.data(), p.size());
|
memcpy(buffer, p.data(), p.size());
|
||||||
|
@ -253,9 +253,9 @@ int main(int argc, char *argv[]) {
|
||||||
if (optind + 1 < argc) {
|
if (optind + 1 < argc) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
|
|
@ -83,9 +83,9 @@ int main(int argc, char *argv[]) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[optind + 1]
|
std::cerr << "warning: ignoring everything after " << argv[optind + 1]
|
||||||
<< std::endl;
|
<< std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
@ -101,7 +101,7 @@ int main(int argc, char *argv[]) {
|
||||||
std::cout << p.size() << " B ";
|
std::cout << p.size() << " B ";
|
||||||
std::cout << std::endl;
|
std::cout << std::endl;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
||||||
|
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
|
|
|
@ -42,9 +42,9 @@ struct stat_s {
|
||||||
|
|
||||||
using stat_t = struct stat_s;
|
using stat_t = struct stat_s;
|
||||||
|
|
||||||
stat_t simdjson_computestats(const padded_string &p) {
|
stat_t simdjson_computestats(const simdjson::padded_string &p) {
|
||||||
stat_t answer;
|
stat_t answer;
|
||||||
ParsedJson pj = build_parsed_json(p);
|
simdjson::ParsedJson pj = simdjson::build_parsed_json(p);
|
||||||
answer.valid = pj.isValid();
|
answer.valid = pj.isValid();
|
||||||
if (!answer.valid) {
|
if (!answer.valid) {
|
||||||
return answer;
|
return answer;
|
||||||
|
@ -134,9 +134,9 @@ int main(int argc, char *argv[]) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[optind + 1]
|
std::cerr << "warning: ignoring everything after " << argv[optind + 1]
|
||||||
<< std::endl;
|
<< std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cerr << "Could not load the file " << filename << std::endl;
|
std::cerr << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
@ -163,7 +163,7 @@ int main(int argc, char *argv[]) {
|
||||||
s.object_count, s.array_count, s.null_count, s.true_count,
|
s.object_count, s.array_count, s.null_count, s.true_count,
|
||||||
s.false_count, s.byte_count, s.structural_indexes_count);
|
s.false_count, s.byte_count, s.structural_indexes_count);
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size());
|
bool allocok = pj.allocateCapacity(p.size());
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "failed to allocate memory" << std::endl;
|
std::cerr << "failed to allocate memory" << std::endl;
|
||||||
|
@ -181,7 +181,7 @@ int main(int argc, char *argv[]) {
|
||||||
for (uint32_t i = 0; i < iterations; i++) {
|
for (uint32_t i = 0; i < iterations; i++) {
|
||||||
unified.start();
|
unified.start();
|
||||||
// The default template is simdjson::instruction_set::native.
|
// The default template is simdjson::instruction_set::native.
|
||||||
bool isok = (find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
bool isok = (simdjson::find_structural_bits<>(p.data(), p.size(), pj) == simdjson::SUCCESS);
|
||||||
unified.end(results);
|
unified.end(results);
|
||||||
|
|
||||||
cy1 += results[0];
|
cy1 += results[0];
|
||||||
|
|
|
@ -4,6 +4,7 @@
|
||||||
#include "simdjson/common_defs.h"
|
#include "simdjson/common_defs.h"
|
||||||
#include "simdjson/parsedjson.h"
|
#include "simdjson/parsedjson.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// structural chars here are
|
// structural chars here are
|
||||||
// they are { 0x7b } 0x7d : 0x3a [ 0x5b ] 0x5d , 0x2c (and NULL)
|
// they are { 0x7b } 0x7d : 0x3a [ 0x5b ] 0x5d , 0x2c (and NULL)
|
||||||
// we are also interested in the four whitespace characters
|
// we are also interested in the four whitespace characters
|
||||||
|
@ -293,5 +294,6 @@ inline size_t codepoint_to_utf8(uint32_t cp, uint8_t *c) {
|
||||||
// will return 0 when the code point was too large.
|
// will return 0 when the code point was too large.
|
||||||
return 0; // bad r
|
return 0; // bad r
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -5,6 +5,7 @@
|
||||||
#include <iomanip>
|
#include <iomanip>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// ends with zero char
|
// ends with zero char
|
||||||
static inline void print_with_escapes(const unsigned char *src) {
|
static inline void print_with_escapes(const unsigned char *src) {
|
||||||
while (*src) {
|
while (*src) {
|
||||||
|
@ -195,6 +196,7 @@ static inline void print_with_escapes(const char *src, std::ostream &os,
|
||||||
size_t len) {
|
size_t len) {
|
||||||
print_with_escapes(reinterpret_cast<const unsigned char *>(src), os, len);
|
print_with_escapes(reinterpret_cast<const unsigned char *>(src), os, len);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
#
|
#
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -12,7 +12,7 @@
|
||||||
#include "simdjson/padded_string.h"
|
#include "simdjson/padded_string.h"
|
||||||
|
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
|
|
||||||
// load a file in memory...
|
// load a file in memory...
|
||||||
// get a corpus; pad out to cache line so we can always use SIMD
|
// get a corpus; pad out to cache line so we can always use SIMD
|
||||||
|
@ -29,6 +29,6 @@
|
||||||
// std::cout << "Could not load the file " << filename << std::endl;
|
// std::cout << "Could not load the file " << filename << std::endl;
|
||||||
// }
|
// }
|
||||||
padded_string get_corpus(const std::string& filename);
|
padded_string get_corpus(const std::string& filename);
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -4,6 +4,7 @@
|
||||||
#include <cstddef>
|
#include <cstddef>
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// Take input from buf and remove useless whitespace, write it to out; buf and
|
// Take input from buf and remove useless whitespace, write it to out; buf and
|
||||||
// out can be the same pointer. Result is null terminated,
|
// out can be the same pointer. Result is null terminated,
|
||||||
// return the string length (minus the null termination).
|
// return the string length (minus the null termination).
|
||||||
|
@ -22,5 +23,5 @@ static inline size_t jsonminify(const std::string_view & p, char *out) {
|
||||||
static inline size_t jsonminify(const padded_string & p, char *out) {
|
static inline size_t jsonminify(const padded_string & p, char *out) {
|
||||||
return jsonminify(p.data(), p.size(), out);
|
return jsonminify(p.data(), p.size(), out);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -15,6 +15,7 @@
|
||||||
#include <unistd.h>
|
#include <unistd.h>
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// The function that users are expected to call is json_parse.
|
// The function that users are expected to call is json_parse.
|
||||||
// We have more than one such function because we want to support several
|
// We have more than one such function because we want to support several
|
||||||
// instruction sets.
|
// instruction sets.
|
||||||
|
@ -27,9 +28,9 @@ extern json_parse_functype *json_parse_ptr;
|
||||||
|
|
||||||
|
|
||||||
// json_parse_implementation is the generic function, it is specialized for various
|
// json_parse_implementation is the generic function, it is specialized for various
|
||||||
// SIMD instruction sets, e.g., as json_parse_implementation<simdjson::instruction_set::avx2>
|
// SIMD instruction sets, e.g., as json_parse_implementation<instruction_set::avx2>
|
||||||
// or json_parse_implementation<simdjson::instruction_set::neon>
|
// or json_parse_implementation<instruction_set::neon>
|
||||||
template<simdjson::instruction_set T>
|
template<instruction_set T>
|
||||||
int json_parse_implementation(const uint8_t *buf, size_t len, ParsedJson &pj, bool reallocifneeded = true) {
|
int json_parse_implementation(const uint8_t *buf, size_t len, ParsedJson &pj, bool reallocifneeded = true) {
|
||||||
if (pj.bytecapacity < len) {
|
if (pj.bytecapacity < len) {
|
||||||
return simdjson::CAPACITY;
|
return simdjson::CAPACITY;
|
||||||
|
@ -200,7 +201,5 @@ WARN_UNUSED
|
||||||
inline ParsedJson build_parsed_json(const padded_string &s) {
|
inline ParsedJson build_parsed_json(const padded_string &s) {
|
||||||
return build_parsed_json(s.data(), s.length(), false);
|
return build_parsed_json(s.data(), s.length(), false);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -6,6 +6,7 @@
|
||||||
#include "simdjson/parsedjson.h"
|
#include "simdjson/parsedjson.h"
|
||||||
#include "simdjson/portability.h"
|
#include "simdjson/portability.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// Allowable floating-point values range from std::numeric_limits<double>::lowest()
|
// Allowable floating-point values range from std::numeric_limits<double>::lowest()
|
||||||
// to std::numeric_limits<double>::max(), so from
|
// to std::numeric_limits<double>::max(), so from
|
||||||
// -1.7976e308 all the way to 1.7975e308 in binary64. The lowest non-zero
|
// -1.7976e308 all the way to 1.7975e308 in binary64. The lowest non-zero
|
||||||
|
@ -553,5 +554,5 @@ static really_inline bool parse_number(const uint8_t *const buf,
|
||||||
return is_structural_or_whitespace(*p);
|
return is_structural_or_whitespace(*p);
|
||||||
#endif // SIMDJSON_SKIPNUMBERPARSING
|
#endif // SIMDJSON_SKIPNUMBERPARSING
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -3,6 +3,8 @@
|
||||||
#include "simdjson/portability.h"
|
#include "simdjson/portability.h"
|
||||||
#include <memory>
|
#include <memory>
|
||||||
#include <cstring>
|
#include <cstring>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// low-level function to allocate memory with padding so we can read passed the
|
// low-level function to allocate memory with padding so we can read passed the
|
||||||
// "length" bytes safely. if you must provide a pointer to some data, create it
|
// "length" bytes safely. if you must provide a pointer to some data, create it
|
||||||
// with this function: length is the max. size in bytes of the string caller is
|
// with this function: length is the max. size in bytes of the string caller is
|
||||||
|
@ -63,5 +65,6 @@ private:
|
||||||
size_t viable_size;
|
size_t viable_size;
|
||||||
char *data_ptr;
|
char *data_ptr;
|
||||||
};
|
};
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -15,7 +15,7 @@
|
||||||
|
|
||||||
#define DEFAULTMAXDEPTH 1024// a JSON document with a depth exceeding 1024 is probably de facto invalid
|
#define DEFAULTMAXDEPTH 1024// a JSON document with a depth exceeding 1024 is probably de facto invalid
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
/************
|
/************
|
||||||
* The JSON is parsed to a tape, see the accompanying tape.md file
|
* The JSON is parsed to a tape, see the accompanying tape.md file
|
||||||
* for documentation.
|
* for documentation.
|
||||||
|
@ -499,4 +499,5 @@ bool ParsedJson::iterator::next() {
|
||||||
current_type = nexttype;
|
current_type = nexttype;
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -7,6 +7,7 @@
|
||||||
#include <iso646.h>
|
#include <iso646.h>
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
static inline bool add_overflow(uint64_t value1, uint64_t value2, uint64_t *result) {
|
static inline bool add_overflow(uint64_t value1, uint64_t value2, uint64_t *result) {
|
||||||
return _addcarry_u64(0, value1, value2, reinterpret_cast<unsigned __int64 *>(result));
|
return _addcarry_u64(0, value1, value2, reinterpret_cast<unsigned __int64 *>(result));
|
||||||
}
|
}
|
||||||
|
@ -34,7 +35,7 @@ static inline int hamming(uint64_t input_num) {
|
||||||
__popcnt((uint32_t)(input_num >> 32)));
|
__popcnt((uint32_t)(input_num >> 32)));
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#else
|
#else
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
#include <cstdlib>
|
#include <cstdlib>
|
||||||
|
@ -42,7 +43,7 @@ static inline int hamming(uint64_t input_num) {
|
||||||
#if defined(__BMI2__) || defined(__POPCOUNT__) || defined(__AVX2__)
|
#if defined(__BMI2__) || defined(__POPCOUNT__) || defined(__AVX2__)
|
||||||
#include <x86intrin.h>
|
#include <x86intrin.h>
|
||||||
#endif
|
#endif
|
||||||
|
namespace simdjson {
|
||||||
static inline bool add_overflow(uint64_t value1, uint64_t value2, uint64_t *result) {
|
static inline bool add_overflow(uint64_t value1, uint64_t value2, uint64_t *result) {
|
||||||
return __builtin_uaddll_overflow(value1, value2, (unsigned long long*)result);
|
return __builtin_uaddll_overflow(value1, value2, (unsigned long long*)result);
|
||||||
}
|
}
|
||||||
|
@ -76,10 +77,11 @@ static inline int hamming(uint64_t input_num) {
|
||||||
return __builtin_popcountll(input_num);
|
return __builtin_popcountll(input_num);
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif // _MSC_VER
|
#endif // _MSC_VER
|
||||||
|
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// portable version of posix_memalign
|
// portable version of posix_memalign
|
||||||
static inline void *aligned_malloc(size_t alignment, size_t size) {
|
static inline void *aligned_malloc(size_t alignment, size_t size) {
|
||||||
void *p;
|
void *p;
|
||||||
|
@ -139,5 +141,6 @@ static inline void aligned_free(void *memblock) {
|
||||||
static inline void aligned_free_char(char *memblock) {
|
static inline void aligned_free_char(char *memblock) {
|
||||||
aligned_free((void*)memblock);
|
aligned_free((void*)memblock);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
#endif // SIMDJSON_PORTABILITY_H
|
#endif // SIMDJSON_PORTABILITY_H
|
||||||
|
|
|
@ -3,46 +3,45 @@
|
||||||
|
|
||||||
#include <string>
|
#include <string>
|
||||||
|
|
||||||
struct simdjson {
|
namespace simdjson {
|
||||||
enum class instruction_set {
|
enum class instruction_set {
|
||||||
avx2,
|
avx2,
|
||||||
sse4_2,
|
sse4_2,
|
||||||
neon,
|
neon,
|
||||||
none,
|
none,
|
||||||
// the 'native' enum class value should point at a good default on the current machine
|
// the 'native' enum class value should point at a good default on the current machine
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
native = avx2
|
native = avx2
|
||||||
#elif defined(__ARM_NEON)
|
#elif defined(__ARM_NEON)
|
||||||
native = neon
|
native = neon
|
||||||
#else
|
#else
|
||||||
// Let us assume that we have an old x64 processor, but one that has SSE (i.e., something
|
// Let us assume that we have an old x64 processor, but one that has SSE (i.e., something
|
||||||
// that came out in the second decade of the XXIst century.
|
// that came out in the second decade of the XXIst century.
|
||||||
// It would be nicer to check explicitly, but there many not be a good way to do so
|
// It would be nicer to check explicitly, but there many not be a good way to do so
|
||||||
// that is cross-platform.
|
// that is cross-platform.
|
||||||
// Under Visual Studio, there is no way to check for SSE4.2 support at compile-time.
|
// Under Visual Studio, there is no way to check for SSE4.2 support at compile-time.
|
||||||
native = sse4_2
|
native = sse4_2
|
||||||
#endif
|
#endif
|
||||||
};
|
|
||||||
|
|
||||||
enum errorValues {
|
|
||||||
SUCCESS = 0,
|
|
||||||
CAPACITY, // This ParsedJson can't support a document that big
|
|
||||||
MEMALLOC, // Error allocating memory, most likely out of memory
|
|
||||||
TAPE_ERROR, // Something went wrong while writing to the tape (stage 2), this is a generic error
|
|
||||||
DEPTH_ERROR, // Your document exceeds the user-specified depth limitation
|
|
||||||
STRING_ERROR, // Problem while parsing a string
|
|
||||||
T_ATOM_ERROR, // Problem while parsing an atom starting with the letter 't'
|
|
||||||
F_ATOM_ERROR, // Problem while parsing an atom starting with the letter 'f'
|
|
||||||
N_ATOM_ERROR, // Problem while parsing an atom starting with the letter 'n'
|
|
||||||
NUMBER_ERROR, // Problem while parsing a number
|
|
||||||
UTF8_ERROR, // the input is not valid UTF-8
|
|
||||||
UNITIALIZED, // unknown error, or uninitialized document
|
|
||||||
EMPTY, // no structural document found
|
|
||||||
UNESCAPED_CHARS, // found unescaped characters in a string.
|
|
||||||
UNCLOSED_STRING, // missing quote at the end
|
|
||||||
UNEXPECTED_ERROR // indicative of a bug in simdjson
|
|
||||||
};
|
|
||||||
static const std::string& errorMsg(const int);
|
|
||||||
};
|
};
|
||||||
|
|
||||||
|
enum errorValues {
|
||||||
|
SUCCESS = 0,
|
||||||
|
CAPACITY, // This ParsedJson can't support a document that big
|
||||||
|
MEMALLOC, // Error allocating memory, most likely out of memory
|
||||||
|
TAPE_ERROR, // Something went wrong while writing to the tape (stage 2), this is a generic error
|
||||||
|
DEPTH_ERROR, // Your document exceeds the user-specified depth limitation
|
||||||
|
STRING_ERROR, // Problem while parsing a string
|
||||||
|
T_ATOM_ERROR, // Problem while parsing an atom starting with the letter 't'
|
||||||
|
F_ATOM_ERROR, // Problem while parsing an atom starting with the letter 'f'
|
||||||
|
N_ATOM_ERROR, // Problem while parsing an atom starting with the letter 'n'
|
||||||
|
NUMBER_ERROR, // Problem while parsing a number
|
||||||
|
UTF8_ERROR, // the input is not valid UTF-8
|
||||||
|
UNITIALIZED, // unknown error, or uninitialized document
|
||||||
|
EMPTY, // no structural document found
|
||||||
|
UNESCAPED_CHARS, // found unescaped characters in a string.
|
||||||
|
UNCLOSED_STRING, // missing quote at the end
|
||||||
|
UNEXPECTED_ERROR // indicative of a bug in simdjson
|
||||||
|
};
|
||||||
|
const std::string& errorMsg(const int);
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -2,9 +2,11 @@
|
||||||
#ifndef SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
#ifndef SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
||||||
#define SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
#define SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
||||||
#define SIMDJSON_VERSION 0.1.2
|
#define SIMDJSON_VERSION 0.1.2
|
||||||
|
namespace simdjson {
|
||||||
enum {
|
enum {
|
||||||
SIMDJSON_VERSION_MAJOR = 0,
|
SIMDJSON_VERSION_MAJOR = 0,
|
||||||
SIMDJSON_VERSION_MINOR = 1,
|
SIMDJSON_VERSION_MINOR = 1,
|
||||||
SIMDJSON_VERSION_REVISION = 2
|
SIMDJSON_VERSION_REVISION = 2
|
||||||
};
|
};
|
||||||
|
}
|
||||||
#endif // SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
#endif // SIMDJSON_INCLUDE_SIMDJSON_VERSION
|
||||||
|
|
|
@ -3,8 +3,9 @@
|
||||||
|
|
||||||
#include "simdjson/portability.h"
|
#include "simdjson/portability.h"
|
||||||
|
|
||||||
#ifdef __AVX__
|
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
|
#ifdef __AVX__
|
||||||
static const unsigned char mask128_epi8[] = {
|
static const unsigned char mask128_epi8[] = {
|
||||||
0x0, 0x1, 0x2, 0x3, 0x4, 0x5, 0x6, 0x7, 0x8, 0x9, 0xa, 0xb, 0xc, 0xd, 0xe,
|
0x0, 0x1, 0x2, 0x3, 0x4, 0x5, 0x6, 0x7, 0x8, 0x9, 0xa, 0xb, 0xc, 0xd, 0xe,
|
||||||
0xf, 0x1, 0x2, 0x3, 0x4, 0x5, 0x6, 0x7, 0x8, 0x9, 0xa, 0xb, 0xc, 0xd, 0xe,
|
0xf, 0x1, 0x2, 0x3, 0x4, 0x5, 0x6, 0x7, 0x8, 0x9, 0xa, 0xb, 0xc, 0xd, 0xe,
|
||||||
|
@ -34984,13 +34985,13 @@ static const unsigned char mask128_epi32[] = {
|
||||||
0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
|
0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
|
||||||
0xff, 0xff, 0xff, 0xff,
|
0xff, 0xff, 0xff, 0xff,
|
||||||
};
|
};
|
||||||
|
}
|
||||||
#endif //__SSE3__
|
#endif //__SSE3__
|
||||||
|
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
|
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
namespace simdjson {
|
||||||
static const uint32_t mask256_epi32[] = {
|
static const uint32_t mask256_epi32[] = {
|
||||||
0, 1, 2, 3, 4, 5, 6, 7, 1, 2, 3, 4, 5, 6, 7, 7, 0, 2, 3, 4, 5, 6, 7, 7, 2,
|
0, 1, 2, 3, 4, 5, 6, 7, 1, 2, 3, 4, 5, 6, 7, 7, 0, 2, 3, 4, 5, 6, 7, 7, 2,
|
||||||
3, 4, 5, 6, 7, 7, 7, 0, 1, 3, 4, 5, 6, 7, 7, 1, 3, 4, 5, 6, 7, 7, 7, 0, 3,
|
3, 4, 5, 6, 7, 7, 7, 0, 1, 3, 4, 5, 6, 7, 7, 1, 3, 4, 5, 6, 7, 7, 7, 0, 3,
|
||||||
|
@ -35074,6 +35075,7 @@ static const uint32_t mask256_epi32[] = {
|
||||||
3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 1, 2, 2, 2, 2, 2, 2, 1, 2, 2, 2, 2, 2, 2, 2,
|
3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 1, 2, 2, 2, 2, 2, 2, 1, 2, 2, 2, 2, 2, 2, 2,
|
||||||
0, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 1, 1, 1, 1, 1, 1, 1, 1,
|
0, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 1, 1, 1, 1, 1, 1, 1, 1,
|
||||||
1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
|
1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
|
||||||
|
}
|
||||||
#endif //__AVX2__
|
#endif //__AVX2__
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -26,9 +26,8 @@
|
||||||
|
|
||||||
// all byte values must be no larger than 0xF4
|
// all byte values must be no larger than 0xF4
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
|
|
||||||
/*****************************/
|
/*****************************/
|
||||||
static inline __m256i push_last_byte_of_a_to_b(__m256i a, __m256i b) {
|
static inline __m256i push_last_byte_of_a_to_b(__m256i a, __m256i b) {
|
||||||
return _mm256_alignr_epi8(b, _mm256_permute2x128_si256(a, b, 0x21), 15);
|
return _mm256_alignr_epi8(b, _mm256_permute2x128_si256(a, b, 0x21), 15);
|
||||||
|
@ -194,4 +193,5 @@ avxcheckUTF8Bytes(__m256i current_bytes,
|
||||||
#else // __AVX2__
|
#else // __AVX2__
|
||||||
#warning "We require AVX2 support!"
|
#warning "We require AVX2 support!"
|
||||||
#endif // __AVX2__
|
#endif // __AVX2__
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -32,6 +32,7 @@
|
||||||
|
|
||||||
#define TRANSPOSE
|
#define TRANSPOSE
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
template<simdjson::instruction_set>
|
template<simdjson::instruction_set>
|
||||||
struct simd_input;
|
struct simd_input;
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
|
@ -853,5 +854,5 @@ WARN_UNUSED
|
||||||
int find_structural_bits(const char *buf, size_t len, ParsedJson &pj) {
|
int find_structural_bits(const char *buf, size_t len, ParsedJson &pj) {
|
||||||
return find_structural_bits<T>(reinterpret_cast<const uint8_t *>(buf), len, pj);
|
return find_structural_bits<T>(reinterpret_cast<const uint8_t *>(buf), len, pj);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -3,6 +3,7 @@
|
||||||
|
|
||||||
#include "simdjson/common_defs.h"
|
#include "simdjson/common_defs.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
struct ParsedJson;
|
struct ParsedJson;
|
||||||
|
|
||||||
void init_state_machine();
|
void init_state_machine();
|
||||||
|
@ -12,5 +13,6 @@ int unified_machine(const uint8_t *buf, size_t len, ParsedJson &pj);
|
||||||
|
|
||||||
WARN_UNUSED
|
WARN_UNUSED
|
||||||
int unified_machine(const char *buf, size_t len, ParsedJson &pj);
|
int unified_machine(const char *buf, size_t len, ParsedJson &pj);
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -5,7 +5,7 @@
|
||||||
#include "simdjson/jsoncharutils.h"
|
#include "simdjson/jsoncharutils.h"
|
||||||
#include "simdjson/parsedjson.h"
|
#include "simdjson/parsedjson.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// begin copypasta
|
// begin copypasta
|
||||||
// These chars yield themselves: " \ /
|
// These chars yield themselves: " \ /
|
||||||
// b -> backspace, f -> formfeed, n -> newline, r -> cr, t -> horizontal tab
|
// b -> backspace, f -> formfeed, n -> newline, r -> cr, t -> horizontal tab
|
||||||
|
@ -201,6 +201,6 @@ really_inline bool parse_string(UNUSED const uint8_t *buf, UNUSED size_t len,
|
||||||
return true;
|
return true;
|
||||||
#endif // SIMDJSON_SKIPSTRINGPARSING
|
#endif // SIMDJSON_SKIPSTRINGPARSING
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -2,6 +2,7 @@
|
||||||
#include <cstring>
|
#include <cstring>
|
||||||
#include <cstdlib>
|
#include <cstdlib>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
char * allocate_padded_buffer(size_t length) {
|
char * allocate_padded_buffer(size_t length) {
|
||||||
// we could do a simple malloc
|
// we could do a simple malloc
|
||||||
//return (char *) malloc(length + SIMDJSON_PADDING);
|
//return (char *) malloc(length + SIMDJSON_PADDING);
|
||||||
|
@ -31,3 +32,4 @@ padded_string get_corpus(const std::string& filename) {
|
||||||
}
|
}
|
||||||
throw std::runtime_error("could not load corpus");
|
throw std::runtime_error("could not load corpus");
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
|
@ -1,8 +1,9 @@
|
||||||
#include "simdjson/portability.h"
|
#include "simdjson/portability.h"
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
|
||||||
#ifndef __AVX2__
|
#ifndef __AVX2__
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
static uint8_t jump_table[256 * 3] = {
|
static uint8_t jump_table[256 * 3] = {
|
||||||
0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0,
|
0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0,
|
||||||
1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1,
|
1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1,
|
||||||
|
@ -56,12 +57,12 @@ size_t jsonminify(const unsigned char *bytes, size_t howmany,
|
||||||
}
|
}
|
||||||
return pos;
|
return pos;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#else
|
#else
|
||||||
|
|
||||||
#include "simdjson/simdprune_tables.h"
|
#include "simdjson/simdprune_tables.h"
|
||||||
#include <cstring>
|
#include <cstring>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// a straightforward comparison of a mask against input.
|
// a straightforward comparison of a mask against input.
|
||||||
static uint64_t cmp_mask_against_input_mini(__m256i input_lo, __m256i input_hi,
|
static uint64_t cmp_mask_against_input_mini(__m256i input_lo, __m256i input_hi,
|
||||||
__m256i mask) {
|
__m256i mask) {
|
||||||
|
@ -247,5 +248,5 @@ size_t jsonminify(const uint8_t *buf, size_t len, uint8_t *out) {
|
||||||
*out = '\0';// NULL termination
|
*out = '\0';// NULL termination
|
||||||
return out - initout;
|
return out - initout;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -7,44 +7,44 @@
|
||||||
#endif
|
#endif
|
||||||
#include "simdjson/simdjson.h"
|
#include "simdjson/simdjson.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
// Responsible to select the best json_parse implementation
|
// Responsible to select the best json_parse implementation
|
||||||
int json_parse_dispatch(const uint8_t *buf, size_t len, ParsedJson &pj, bool reallocifneeded) {
|
int json_parse_dispatch(const uint8_t *buf, size_t len, ParsedJson &pj, bool reallocifneeded) {
|
||||||
// Versions for each implementation
|
// Versions for each implementation
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
json_parse_functype* avx_implementation = &json_parse_implementation<simdjson::instruction_set::avx2>;
|
json_parse_functype* avx_implementation = &json_parse_implementation<instruction_set::avx2>;
|
||||||
#endif
|
#endif
|
||||||
#ifdef __SSE4_2__
|
#ifdef __SSE4_2__
|
||||||
// json_parse_functype* sse4_2_implementation = &json_parse_implementation<simdjson::instruction_set::sse4_2>; // not implemented yet
|
// json_parse_functype* sse4_2_implementation = &json_parse_implementation<instruction_set::sse4_2>; // not implemented yet
|
||||||
#endif
|
#endif
|
||||||
#ifdef __ARM_NEON
|
#ifdef __ARM_NEON
|
||||||
json_parse_functype* neon_implementation = &json_parse_implementation<simdjson::instruction_set::neon>;
|
json_parse_functype* neon_implementation = &json_parse_implementation<instruction_set::neon>;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// Determining which implementation is the more suitable
|
// Determining which implementation is the more suitable
|
||||||
// Should be done at runtime. Does not make any sense on preprocessor.
|
// Should be done at runtime. Does not make any sense on preprocessor.
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
simdjson::instruction_set best_implementation = simdjson::instruction_set::avx2;
|
instruction_set best_implementation = instruction_set::avx2;
|
||||||
#elif defined (__SSE4_2__)
|
#elif defined (__SSE4_2__)
|
||||||
simdjson::instruction_set best_implementation = simdjson::instruction_set::sse4_2;
|
instruction_set best_implementation = instruction_set::sse4_2;
|
||||||
#elif defined (__ARM_NEON)
|
#elif defined (__ARM_NEON)
|
||||||
simdjson::instruction_set best_implementation = simdjson::instruction_set::neon;
|
instruction_set best_implementation = instruction_set::neon;
|
||||||
#else
|
#else
|
||||||
simdjson::instruction_set best_implementation = simdjson::instruction_set::none;
|
instruction_set best_implementation = instruction_set::none;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// Selecting the best implementation
|
// Selecting the best implementation
|
||||||
switch (best_implementation) {
|
switch (best_implementation) {
|
||||||
#ifdef __AVX2__
|
#ifdef __AVX2__
|
||||||
case simdjson::instruction_set::avx2 :
|
case instruction_set::avx2 :
|
||||||
json_parse_ptr = avx_implementation;
|
json_parse_ptr = avx_implementation;
|
||||||
break;
|
break;
|
||||||
#elif defined (__SSE4_2__)
|
#elif defined (__SSE4_2__)
|
||||||
/*case simdjson::instruction_set::sse4_2 :
|
/*case instruction_set::sse4_2 :
|
||||||
json_parse_ptr = sse4_2_implementation;
|
json_parse_ptr = sse4_2_implementation;
|
||||||
break;*/
|
break;*/
|
||||||
#elif defined (__ARM_NEON)
|
#elif defined (__ARM_NEON)
|
||||||
case simdjson::instruction_set::neon :
|
case instruction_set::neon :
|
||||||
json_parse_ptr = neon_implementation;
|
json_parse_ptr = neon_implementation;
|
||||||
break;
|
break;
|
||||||
#endif
|
#endif
|
||||||
|
@ -69,3 +69,4 @@ ParsedJson build_parsed_json(const uint8_t *buf, size_t len, bool reallocifneede
|
||||||
}
|
}
|
||||||
return pj;
|
return pj;
|
||||||
}
|
}
|
||||||
|
}
|
|
@ -1,5 +1,6 @@
|
||||||
#include "simdjson/parsedjson.h"
|
#include "simdjson/parsedjson.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
ParsedJson::ParsedJson() :
|
ParsedJson::ParsedJson() :
|
||||||
structural_indexes(nullptr), tape(nullptr), containing_scope_offset(nullptr),
|
structural_indexes(nullptr), tape(nullptr), containing_scope_offset(nullptr),
|
||||||
ret_address(nullptr), string_buf(nullptr), current_string_buf_loc(nullptr) {}
|
ret_address(nullptr), string_buf(nullptr), current_string_buf_loc(nullptr) {}
|
||||||
|
@ -97,7 +98,7 @@ int ParsedJson::getErrorCode() const {
|
||||||
}
|
}
|
||||||
|
|
||||||
std::string ParsedJson::getErrorMsg() const {
|
std::string ParsedJson::getErrorMsg() const {
|
||||||
return simdjson::errorMsg(errorcode);
|
return errorMsg(errorcode);
|
||||||
}
|
}
|
||||||
|
|
||||||
void ParsedJson::deallocate() {
|
void ParsedJson::deallocate() {
|
||||||
|
@ -318,3 +319,4 @@ bool ParsedJson::dump_raw_tape(std::ostream &os) {
|
||||||
os << tapeidx << " : "<< type <<"\t// pointing to " << payload <<" (start root)\n";
|
os << tapeidx << " : "<< type <<"\t// pointing to " << payload <<" (start root)\n";
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
|
@ -2,6 +2,7 @@
|
||||||
#include "simdjson/common_defs.h"
|
#include "simdjson/common_defs.h"
|
||||||
#include <iterator>
|
#include <iterator>
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
ParsedJson::iterator::iterator(ParsedJson &pj_) : pj(pj_), depth(0), location(0), tape_length(0), depthindex(nullptr) {
|
ParsedJson::iterator::iterator(ParsedJson &pj_) : pj(pj_), depth(0), location(0), tape_length(0), depthindex(nullptr) {
|
||||||
if(!pj.isValid()) {
|
if(!pj.isValid()) {
|
||||||
throw InvalidJSON();
|
throw InvalidJSON();
|
||||||
|
@ -92,3 +93,4 @@ bool ParsedJson::iterator::print(std::ostream &os, bool escape_strings) const {
|
||||||
}
|
}
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
|
@ -1,23 +1,25 @@
|
||||||
#include <map>
|
#include <map>
|
||||||
#include "simdjson/simdjson.h"
|
#include "simdjson/simdjson.h"
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
const std::map<int, const std::string> errorStrings = {
|
const std::map<int, const std::string> errorStrings = {
|
||||||
{simdjson::SUCCESS, "No errors"},
|
{SUCCESS, "No errors"},
|
||||||
{simdjson::CAPACITY, "This ParsedJson can't support a document that big"},
|
{CAPACITY, "This ParsedJson can't support a document that big"},
|
||||||
{simdjson::MEMALLOC, "Error allocating memory, we're most likely out of memory"},
|
{MEMALLOC, "Error allocating memory, we're most likely out of memory"},
|
||||||
{simdjson::TAPE_ERROR, "Something went wrong while writing to the tape"},
|
{TAPE_ERROR, "Something went wrong while writing to the tape"},
|
||||||
{simdjson::STRING_ERROR, "Problem while parsing a string"},
|
{STRING_ERROR, "Problem while parsing a string"},
|
||||||
{simdjson::T_ATOM_ERROR, "Problem while parsing an atom starting with the letter 't'"},
|
{T_ATOM_ERROR, "Problem while parsing an atom starting with the letter 't'"},
|
||||||
{simdjson::F_ATOM_ERROR, "Problem while parsing an atom starting with the letter 'f'"},
|
{F_ATOM_ERROR, "Problem while parsing an atom starting with the letter 'f'"},
|
||||||
{simdjson::N_ATOM_ERROR, "Problem while parsing an atom starting with the letter 'n'"},
|
{N_ATOM_ERROR, "Problem while parsing an atom starting with the letter 'n'"},
|
||||||
{simdjson::NUMBER_ERROR, "Problem while parsing a number"},
|
{NUMBER_ERROR, "Problem while parsing a number"},
|
||||||
{simdjson::UTF8_ERROR, "The input is not valid UTF-8"},
|
{UTF8_ERROR, "The input is not valid UTF-8"},
|
||||||
{simdjson::UNITIALIZED, "Unitialized"},
|
{UNITIALIZED, "Unitialized"},
|
||||||
{simdjson::EMPTY, "Empty"},
|
{EMPTY, "Empty"},
|
||||||
{simdjson::UNESCAPED_CHARS, "Within strings, some characters must be escapted, we found unescapted characters"},
|
{UNESCAPED_CHARS, "Within strings, some characters must be escapted, we found unescapted characters"},
|
||||||
{simdjson::UNEXPECTED_ERROR, "Unexpected error, consider reporting this problem as you may have found a bug in simdjson"},
|
{UNEXPECTED_ERROR, "Unexpected error, consider reporting this problem as you may have found a bug in simdjson"},
|
||||||
};
|
};
|
||||||
|
|
||||||
const std::string& simdjson::errorMsg(const int errorCode) {
|
const std::string& errorMsg(const int errorCode) {
|
||||||
return errorStrings.at(errorCode);
|
return errorStrings.at(errorCode);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
|
@ -11,6 +11,7 @@
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
#define PATH_SEP '/'
|
#define PATH_SEP '/'
|
||||||
|
|
||||||
|
namespace simdjson {
|
||||||
|
|
||||||
WARN_UNUSED
|
WARN_UNUSED
|
||||||
really_inline bool is_valid_true_atom(const uint8_t *loc) {
|
really_inline bool is_valid_true_atom(const uint8_t *loc) {
|
||||||
|
@ -82,7 +83,7 @@ int unified_machine(const uint8_t *buf, size_t len, ParsedJson &pj) {
|
||||||
uint32_t depth = 0; // could have an arbitrary starting depth
|
uint32_t depth = 0; // could have an arbitrary starting depth
|
||||||
pj.init(); // sets isvalid to false
|
pj.init(); // sets isvalid to false
|
||||||
if(pj.bytecapacity < len) {
|
if(pj.bytecapacity < len) {
|
||||||
pj.errorcode = simdjson::CAPACITY;
|
pj.errorcode = CAPACITY;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
}
|
}
|
||||||
// this macro reads the next structural character, updating idx, i and c.
|
// this macro reads the next structural character, updating idx, i and c.
|
||||||
|
@ -526,7 +527,7 @@ succeed:
|
||||||
pj.write_tape(pj.containing_scope_offset[depth], 'r'); // r is root
|
pj.write_tape(pj.containing_scope_offset[depth], 'r'); // r is root
|
||||||
|
|
||||||
pj.isvalid = true;
|
pj.isvalid = true;
|
||||||
pj.errorcode = simdjson::SUCCESS;
|
pj.errorcode = SUCCESS;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
fail:
|
fail:
|
||||||
// we do not need the next line because this is done by pj.init(), pessimistically.
|
// we do not need the next line because this is done by pj.init(), pessimistically.
|
||||||
|
@ -537,12 +538,12 @@ fail:
|
||||||
// We could even trigger special code paths to assess what happened carefully,
|
// We could even trigger special code paths to assess what happened carefully,
|
||||||
// all without any added cost.
|
// all without any added cost.
|
||||||
if (depth >= pj.depthcapacity) {
|
if (depth >= pj.depthcapacity) {
|
||||||
pj.errorcode = simdjson::DEPTH_ERROR;
|
pj.errorcode = DEPTH_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
}
|
}
|
||||||
switch(c) {
|
switch(c) {
|
||||||
case '"':
|
case '"':
|
||||||
pj.errorcode = simdjson::STRING_ERROR;
|
pj.errorcode = STRING_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
case '0':
|
case '0':
|
||||||
case '1':
|
case '1':
|
||||||
|
@ -555,24 +556,25 @@ fail:
|
||||||
case '8':
|
case '8':
|
||||||
case '9':
|
case '9':
|
||||||
case '-':
|
case '-':
|
||||||
pj.errorcode = simdjson::NUMBER_ERROR;
|
pj.errorcode = NUMBER_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
case 't':
|
case 't':
|
||||||
pj.errorcode = simdjson::T_ATOM_ERROR;
|
pj.errorcode = T_ATOM_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
case 'n':
|
case 'n':
|
||||||
pj.errorcode = simdjson::N_ATOM_ERROR;
|
pj.errorcode = N_ATOM_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
case 'f':
|
case 'f':
|
||||||
pj.errorcode = simdjson::F_ATOM_ERROR;
|
pj.errorcode = F_ATOM_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
default:
|
default:
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
pj.errorcode = simdjson::TAPE_ERROR;
|
pj.errorcode = TAPE_ERROR;
|
||||||
return pj.errorcode;
|
return pj.errorcode;
|
||||||
}
|
}
|
||||||
|
|
||||||
int unified_machine(const char *buf, size_t len, ParsedJson &pj) {
|
int unified_machine(const char *buf, size_t len, ParsedJson &pj) {
|
||||||
return unified_machine(reinterpret_cast<const uint8_t*>(buf), len, pj);
|
return unified_machine(reinterpret_cast<const uint8_t*>(buf), len, pj);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
|
@ -59,9 +59,9 @@ int main(int argc, char *argv[]) {
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
const char *filename = argv[optind];
|
const char *filename = argv[optind];
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
@ -76,7 +76,7 @@ int main(int argc, char *argv[]) {
|
||||||
std::cout << p.size() << " B ";
|
std::cout << p.size() << " B ";
|
||||||
std::cout << std::endl;
|
std::cout << std::endl;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
size_t maxdepth = 1024 * 4;
|
size_t maxdepth = 1024 * 4;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), maxdepth);
|
bool allocok = pj.allocateCapacity(p.size(), maxdepth);
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
|
|
|
@ -39,7 +39,7 @@ bool skyprophet_test() {
|
||||||
if (maxsize < s.size())
|
if (maxsize < s.size())
|
||||||
maxsize = s.size();
|
maxsize = s.size();
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
if (!pj.allocateCapacity(maxsize)) {
|
if (!pj.allocateCapacity(maxsize)) {
|
||||||
printf("allocation failure in skyprophet_test\n");
|
printf("allocation failure in skyprophet_test\n");
|
||||||
return false;
|
return false;
|
||||||
|
|
|
@ -65,14 +65,14 @@ bool validate(const char *dirname) {
|
||||||
} else {
|
} else {
|
||||||
strcpy(fullpath + dirlen, name);
|
strcpy(fullpath + dirlen, name);
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(fullpath).swap(p);
|
simdjson::get_corpus(fullpath).swap(p);
|
||||||
} catch (const std::exception &e) {
|
} catch (const std::exception &e) {
|
||||||
std::cerr << "Could not load the file " << fullpath << std::endl;
|
std::cerr << "Could not load the file " << fullpath << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "can't allocate memory" << std::endl;
|
std::cerr << "can't allocate memory" << std::endl;
|
||||||
|
|
|
@ -132,15 +132,15 @@ bool validate(const char *dirname) {
|
||||||
} else {
|
} else {
|
||||||
strcpy(fullpath + dirlen, name);
|
strcpy(fullpath + dirlen, name);
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(fullpath).swap(p);
|
simdjson::get_corpus(fullpath).swap(p);
|
||||||
} catch (const std::exception &e) {
|
} catch (const std::exception &e) {
|
||||||
std::cout << "Could not load the file " << fullpath << std::endl;
|
std::cout << "Could not load the file " << fullpath << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
// terrible hack but just to get it working
|
// terrible hack but just to get it working
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "can't allocate memory" << std::endl;
|
std::cerr << "can't allocate memory" << std::endl;
|
||||||
|
|
|
@ -325,14 +325,14 @@ bool validate(const char *dirname) {
|
||||||
} else {
|
} else {
|
||||||
strcpy(fullpath + dirlen, name);
|
strcpy(fullpath + dirlen, name);
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(fullpath).swap(p);
|
simdjson::get_corpus(fullpath).swap(p);
|
||||||
} catch (const std::exception &e) {
|
} catch (const std::exception &e) {
|
||||||
std::cout << "Could not load the file " << fullpath << std::endl;
|
std::cout << "Could not load the file " << fullpath << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "can't allocate memory" << std::endl;
|
std::cerr << "can't allocate memory" << std::endl;
|
||||||
|
|
|
@ -5,7 +5,7 @@
|
||||||
#include "simdjson/jsonioutil.h"
|
#include "simdjson/jsonioutil.h"
|
||||||
#include "simdjson/jsonparser.h"
|
#include "simdjson/jsonparser.h"
|
||||||
|
|
||||||
void compute_dump(ParsedJson::iterator &pjh) {
|
void compute_dump(simdjson::ParsedJson::iterator &pjh) {
|
||||||
if (pjh.is_object()) {
|
if (pjh.is_object()) {
|
||||||
std::cout << "{";
|
std::cout << "{";
|
||||||
if (pjh.down()) {
|
if (pjh.down()) {
|
||||||
|
@ -72,26 +72,26 @@ int main(int argc, char *argv[]) {
|
||||||
if (optind + 1 < argc) {
|
if (optind + 1 < argc) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
std::cerr << "warning: ignoring everything after " << argv[optind + 1] << std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
ParsedJson pj;
|
simdjson::ParsedJson pj;
|
||||||
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
bool allocok = pj.allocateCapacity(p.size(), 1024);
|
||||||
if (!allocok) {
|
if (!allocok) {
|
||||||
std::cerr << "failed to allocate memory" << std::endl;
|
std::cerr << "failed to allocate memory" << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
int res = json_parse(p, pj); // do the parsing, return false on error
|
int res = simdjson::json_parse(p, pj); // do the parsing, return false on error
|
||||||
if (res) {
|
if (res) {
|
||||||
std::cerr << " Parsing failed. " << std::endl;
|
std::cerr << " Parsing failed. " << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
if (apidump) {
|
if (apidump) {
|
||||||
ParsedJson::iterator pjh(pj);
|
simdjson::ParsedJson::iterator pjh(pj);
|
||||||
if (!pjh.isOk()) {
|
if (!pjh.isOk()) {
|
||||||
std::cerr << " Could not iterate parsed result. " << std::endl;
|
std::cerr << " Could not iterate parsed result. " << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
|
|
@ -41,9 +41,9 @@ using stat_t = struct stat_s;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
stat_t simdjson_computestats(const padded_string &p) {
|
stat_t simdjson_computestats(const simdjson::padded_string &p) {
|
||||||
stat_t answer;
|
stat_t answer;
|
||||||
ParsedJson pj = build_parsed_json(p);
|
simdjson::ParsedJson pj = simdjson::build_parsed_json(p);
|
||||||
answer.valid = pj.isValid();
|
answer.valid = pj.isValid();
|
||||||
if (!answer.valid) {
|
if (!answer.valid) {
|
||||||
return answer;
|
return answer;
|
||||||
|
@ -125,9 +125,9 @@ int main(int argc, char *argv[]) {
|
||||||
if (myoptind + 1 < argc) {
|
if (myoptind + 1 < argc) {
|
||||||
std::cerr << "warning: ignoring everything after " << argv[myoptind + 1] << std::endl;
|
std::cerr << "warning: ignoring everything after " << argv[myoptind + 1] << std::endl;
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
try {
|
try {
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception &e) { // caught by reference to base
|
} catch (const std::exception &e) { // caught by reference to base
|
||||||
std::cerr << "Could not load the file " << filename << std::endl;
|
std::cerr << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
|
|
|
@ -8,14 +8,14 @@ int main(int argc, char *argv[]) {
|
||||||
std::cerr << "Usage: " << argv[0] << " <jsonfile>\n";
|
std::cerr << "Usage: " << argv[0] << " <jsonfile>\n";
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
padded_string p;
|
simdjson::padded_string p;
|
||||||
std::string filename = argv[argc - 1];
|
std::string filename = argv[argc - 1];
|
||||||
try{
|
try{
|
||||||
get_corpus(filename).swap(p);
|
simdjson::get_corpus(filename).swap(p);
|
||||||
} catch (const std::exception& e) {
|
} catch (const std::exception& e) {
|
||||||
std::cout << "Could not load the file " << filename << std::endl;
|
std::cout << "Could not load the file " << filename << std::endl;
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
jsonminify(p, p.data());
|
simdjson::jsonminify(p, p.data());
|
||||||
printf("%s",p.data());
|
printf("%s",p.data());
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue