simdjson/fuzz/fuzz_utf8.cpp

54 lines
1.5 KiB
C++

/*
* For fuzzing all of the implementations (haswell/fallback/westmere),
* finding any difference between the output of each which would
* indicate inconsistency. Also, it gets the non-default backend
* some fuzzing love.
*
* Copyright Paul Dreik 20200912 for the simdjson project.
*/
#include "simdjson.h"
#include <cstddef>
#include <cstdlib>
extern "C" int LLVMFuzzerTestOneInput(const uint8_t *Data, size_t Size) {
auto utf8verify=[Data,Size](const simdjson::implementation* impl) -> bool {
return impl->validate_utf8((const char*)Data,Size);
};
auto first = simdjson::available_implementations.begin();
auto last = simdjson::available_implementations.end();
auto it = first;
while((it != last) && (!(*it)->supported_by_runtime_system())) { it++; }
assert(it != last);
const bool reference=utf8verify(*it);
bool failed=false;
for(; it != last; ++it) {
if(!(*it)->supported_by_runtime_system()) { continue; }
const bool current=utf8verify(*it);
if(current!=reference) {
failed=true;
}
}
if(failed) {
std::cerr<<std::boolalpha<<"Mismatch between implementations of validate_utf8() found:\n";
for(it = first;it != last; ++it) {
if(!(*it)->supported_by_runtime_system()) { continue; }
const bool current=utf8verify(*it);
std::cerr<<(*it)->name()<<" returns "<<current<<std::endl;
}
std::abort();
}
//all is well
return 0;
}