2020-03-08 05:10:23 +08:00
|
|
|
#include <cinttypes>
|
|
|
|
#include <cstdio>
|
|
|
|
#include <cstdlib>
|
|
|
|
#include <cstring>
|
|
|
|
#include <iostream>
|
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
#include <cmath>
|
|
|
|
#include <set>
|
|
|
|
#include <string_view>
|
|
|
|
|
|
|
|
#include "simdjson.h"
|
|
|
|
|
|
|
|
using namespace simdjson;
|
|
|
|
using namespace std;
|
|
|
|
|
2020-06-21 13:03:57 +08:00
|
|
|
#include "test_macros.h"
|
2020-03-08 05:10:23 +08:00
|
|
|
|
|
|
|
namespace parser_load {
|
2020-06-03 11:21:46 +08:00
|
|
|
const char * NONEXISTENT_FILE = "this_file_does_not_exist.json";
|
2020-03-08 05:10:23 +08:00
|
|
|
bool parser_load_capacity() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser(1); // 1 byte max capacity
|
2020-04-15 08:26:26 +08:00
|
|
|
auto error = parser.load(TWITTER_JSON).error();
|
2020-03-08 05:10:23 +08:00
|
|
|
ASSERT_ERROR(error, CAPACITY);
|
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool parser_load_many_capacity() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser(1); // 1 byte max capacity
|
2020-06-21 06:47:41 +08:00
|
|
|
dom::document_stream docs;
|
|
|
|
ASSERT_SUCCESS(parser.load_many(TWITTER_JSON).get(docs));
|
|
|
|
for (auto doc : docs) {
|
2020-04-15 08:26:26 +08:00
|
|
|
ASSERT_ERROR(doc.error(), CAPACITY);
|
2020-03-08 05:10:23 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
TEST_FAIL("No documents returned");
|
|
|
|
}
|
|
|
|
|
2020-06-05 08:40:15 +08:00
|
|
|
bool parser_parse_many_documents_error_in_the_middle() {
|
|
|
|
TEST_START();
|
|
|
|
const padded_string DOC = "1 2 [} 3"_padded;
|
|
|
|
size_t count = 0;
|
|
|
|
dom::parser parser;
|
2020-06-21 06:47:41 +08:00
|
|
|
dom::document_stream docs;
|
|
|
|
ASSERT_SUCCESS(parser.parse_many(DOC).get(docs));
|
|
|
|
for (auto doc : docs) {
|
2020-06-05 08:40:15 +08:00
|
|
|
count++;
|
2020-06-22 05:36:38 +08:00
|
|
|
uint64_t val;
|
|
|
|
auto error = doc.get(val);
|
2020-06-05 08:40:15 +08:00
|
|
|
if (count == 3) {
|
|
|
|
ASSERT_ERROR(error, TAPE_ERROR);
|
|
|
|
} else {
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_SUCCESS(error);
|
|
|
|
ASSERT_EQUAL(val, count);
|
2020-06-05 08:40:15 +08:00
|
|
|
}
|
|
|
|
}
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_EQUAL(count, 3);
|
2020-06-05 08:40:15 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
|
|
|
|
bool parser_parse_many_documents_partial() {
|
|
|
|
TEST_START();
|
|
|
|
const padded_string DOC = "["_padded;
|
|
|
|
size_t count = 0;
|
|
|
|
dom::parser parser;
|
2020-06-21 06:47:41 +08:00
|
|
|
dom::document_stream docs;
|
|
|
|
ASSERT_SUCCESS(parser.parse_many(DOC).get(docs));
|
|
|
|
for (auto doc : docs) {
|
2020-06-05 08:40:15 +08:00
|
|
|
count++;
|
|
|
|
ASSERT_ERROR(doc.error(), TAPE_ERROR);
|
|
|
|
}
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_EQUAL(count, 1);
|
2020-06-05 08:40:15 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
|
|
|
|
bool parser_parse_many_documents_partial_at_the_end() {
|
|
|
|
TEST_START();
|
|
|
|
const padded_string DOC = "1 2 ["_padded;
|
|
|
|
size_t count = 0;
|
|
|
|
dom::parser parser;
|
2020-06-21 06:47:41 +08:00
|
|
|
dom::document_stream docs;
|
|
|
|
ASSERT_SUCCESS(parser.parse_many(DOC).get(docs));
|
|
|
|
for (auto doc : docs) {
|
2020-06-05 08:40:15 +08:00
|
|
|
count++;
|
2020-06-22 05:36:38 +08:00
|
|
|
uint64_t val;
|
|
|
|
auto error = doc.get(val);
|
2020-06-05 08:40:15 +08:00
|
|
|
if (count == 3) {
|
|
|
|
ASSERT_ERROR(error, TAPE_ERROR);
|
|
|
|
} else {
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_SUCCESS(error);
|
|
|
|
ASSERT_EQUAL(val, count);
|
2020-06-05 08:40:15 +08:00
|
|
|
}
|
|
|
|
}
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_EQUAL(count, 3);
|
2020-06-05 08:40:15 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
|
2020-03-08 05:10:23 +08:00
|
|
|
bool parser_load_nonexistent() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser;
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_ERROR( parser.load(NONEXISTENT_FILE).error(), IO_ERROR );
|
2020-03-08 05:10:23 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool parser_load_many_nonexistent() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser;
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_ERROR( parser.load_many(NONEXISTENT_FILE).error(), IO_ERROR );
|
2020-06-22 02:49:52 +08:00
|
|
|
TEST_SUCCEED();
|
2020-03-08 05:10:23 +08:00
|
|
|
}
|
|
|
|
bool padded_string_load_nonexistent() {
|
|
|
|
TEST_START();
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_ERROR(padded_string::load(NONEXISTENT_FILE).error(), IO_ERROR);
|
2020-03-08 05:10:23 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
|
|
|
|
bool parser_load_chain() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser;
|
2020-10-13 21:18:54 +08:00
|
|
|
simdjson_unused uint64_t foo;
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_ERROR( parser.load(NONEXISTENT_FILE)["foo"].get(foo), IO_ERROR);
|
2020-03-08 05:10:23 +08:00
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool parser_load_many_chain() {
|
|
|
|
TEST_START();
|
2020-03-29 02:43:41 +08:00
|
|
|
dom::parser parser;
|
2020-10-13 21:18:54 +08:00
|
|
|
simdjson_unused dom::document_stream stream;
|
2020-06-22 05:36:38 +08:00
|
|
|
ASSERT_ERROR( parser.load_many(NONEXISTENT_FILE).get(stream), IO_ERROR );
|
2020-06-22 02:49:52 +08:00
|
|
|
TEST_SUCCEED();
|
2020-03-08 05:10:23 +08:00
|
|
|
}
|
2020-06-22 05:36:38 +08:00
|
|
|
|
2020-03-08 05:10:23 +08:00
|
|
|
bool run() {
|
2020-06-05 08:40:15 +08:00
|
|
|
return true
|
|
|
|
&& parser_load_capacity()
|
|
|
|
&& parser_load_many_capacity()
|
|
|
|
&& parser_load_nonexistent()
|
|
|
|
&& parser_load_many_nonexistent()
|
|
|
|
&& padded_string_load_nonexistent()
|
|
|
|
&& parser_load_chain()
|
|
|
|
&& parser_load_many_chain()
|
|
|
|
&& parser_parse_many_documents_error_in_the_middle()
|
|
|
|
&& parser_parse_many_documents_partial()
|
|
|
|
&& parser_parse_many_documents_partial_at_the_end()
|
|
|
|
;
|
2020-03-08 05:10:23 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-13 01:25:22 +08:00
|
|
|
namespace adversarial {
|
|
|
|
#define PADDING_FILLED_WITH_NUMBERS "222222222222222222222222222222222"
|
|
|
|
bool number_overrun_at_root() {
|
|
|
|
TEST_START();
|
|
|
|
constexpr const char *json = "1" PADDING_FILLED_WITH_NUMBERS ",";
|
2020-09-23 15:07:14 +08:00
|
|
|
constexpr size_t len = 1; // std::strlen("1");
|
2020-08-13 01:25:22 +08:00
|
|
|
|
|
|
|
dom::parser parser;
|
|
|
|
uint64_t foo;
|
|
|
|
ASSERT_SUCCESS( parser.parse(json, len).get(foo) ); // Parse just the first digit
|
|
|
|
ASSERT_EQUAL( foo, 1 );
|
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool number_overrun_in_array() {
|
|
|
|
TEST_START();
|
|
|
|
constexpr const char *json = "[1" PADDING_FILLED_WITH_NUMBERS "]";
|
2020-09-23 15:07:14 +08:00
|
|
|
constexpr size_t len = 2; // std::strlen("[1");
|
2020-08-13 01:25:22 +08:00
|
|
|
|
|
|
|
dom::parser parser;
|
|
|
|
uint64_t foo;
|
|
|
|
ASSERT_ERROR( parser.parse(json, len).get(foo), TAPE_ERROR ); // Parse just the first digit
|
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool number_overrun_in_object() {
|
|
|
|
TEST_START();
|
|
|
|
constexpr const char *json = "{\"key\":1" PADDING_FILLED_WITH_NUMBERS "}";
|
2020-09-23 15:07:14 +08:00
|
|
|
constexpr size_t len = 8; // std::strlen("{\"key\":1");
|
2020-08-13 01:25:22 +08:00
|
|
|
|
|
|
|
dom::parser parser;
|
|
|
|
uint64_t foo;
|
|
|
|
ASSERT_ERROR( parser.parse(json, len).get(foo), TAPE_ERROR ); // Parse just the first digit
|
|
|
|
TEST_SUCCEED();
|
|
|
|
}
|
|
|
|
bool run() {
|
2020-09-23 15:07:14 +08:00
|
|
|
static_assert(33 > SIMDJSON_PADDING, "corruption test doesn't have enough padding"); // 33 = std::strlen(PADDING_FILLED_WITH_NUMBERS)
|
2020-08-13 01:25:22 +08:00
|
|
|
return true
|
|
|
|
&& number_overrun_at_root()
|
|
|
|
&& number_overrun_in_array()
|
|
|
|
&& number_overrun_in_object()
|
|
|
|
;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-03-08 05:10:23 +08:00
|
|
|
int main() {
|
|
|
|
// this is put here deliberately to check that the documentation is correct (README),
|
|
|
|
// should this fail to compile, you should update the documentation:
|
2020-11-04 04:48:09 +08:00
|
|
|
if (simdjson::active_implementation->name() == "unsupported") {
|
|
|
|
printf("unsupported CPU\n");
|
2020-03-08 05:10:23 +08:00
|
|
|
}
|
|
|
|
std::cout << "Running error tests." << std::endl;
|
2020-08-13 01:25:22 +08:00
|
|
|
if (!(true
|
|
|
|
&& parser_load::run()
|
|
|
|
&& adversarial::run()
|
|
|
|
)) {
|
2020-03-08 05:10:23 +08:00
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
std::cout << "Error tests are ok." << std::endl;
|
|
|
|
return EXIT_SUCCESS;
|
|
|
|
}
|