2021-01-05 07:22:35 +08:00
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#ifdef SIMDJSON_COMPETITION_RAPIDJSON
|
|
|
|
|
|
|
|
#include "distinct_user_id.h"
|
|
|
|
|
|
|
|
namespace distinct_user_id {
|
|
|
|
|
|
|
|
using namespace rapidjson;
|
|
|
|
|
2021-01-05 12:20:24 +08:00
|
|
|
struct rapidjson_base {
|
2021-01-05 07:22:35 +08:00
|
|
|
Document doc{};
|
|
|
|
|
2021-01-06 03:31:34 +08:00
|
|
|
bool run(Document &root, std::vector<uint64_t> &result) {
|
2021-01-06 02:42:17 +08:00
|
|
|
if (root.HasParseError()) { printf("parse error\n"); return false; }
|
|
|
|
if (!root.IsObject()) { printf("root is not an object\n"); return false; }
|
2021-01-05 07:22:35 +08:00
|
|
|
auto statuses = root.FindMember("statuses");
|
2021-01-06 02:42:17 +08:00
|
|
|
if (statuses == root.MemberEnd() || !statuses->value.IsArray()) { printf("statuses is not an array\n"); return false; }
|
2021-01-05 07:22:35 +08:00
|
|
|
for (auto &tweet : statuses->value.GetArray()) {
|
|
|
|
if (!tweet.IsObject()) { return false; }
|
|
|
|
auto user = tweet.FindMember("user");
|
2021-01-06 02:42:17 +08:00
|
|
|
if (user == tweet.MemberEnd() || !user->value.IsObject()) { printf("user is not an object\n"); return false; }
|
2021-01-05 07:22:35 +08:00
|
|
|
auto id = user->value.FindMember("id");
|
2021-01-06 02:42:17 +08:00
|
|
|
if (id == user->value.MemberEnd() || !id->value.IsUint64()) { printf("id is not an int\n"); return false; }
|
2021-01-06 03:31:34 +08:00
|
|
|
result.push_back(id->value.GetUint64());
|
2021-01-05 07:22:35 +08:00
|
|
|
|
|
|
|
auto retweet = tweet.FindMember("retweeted_status");
|
|
|
|
if (retweet != tweet.MemberEnd()) {
|
2021-01-06 02:42:17 +08:00
|
|
|
if (!retweet->value.IsObject()) { printf("retweet is not an object\n"); return false; }
|
2021-01-05 07:22:35 +08:00
|
|
|
user = retweet->value.FindMember("user");
|
2021-01-06 02:42:17 +08:00
|
|
|
if (user == retweet->value.MemberEnd() || !user->value.IsObject()) { printf("rewtweet.user is not an object\n"); return false; }
|
2021-01-05 07:22:35 +08:00
|
|
|
id = user->value.FindMember("id");
|
2021-01-06 02:42:17 +08:00
|
|
|
if (id == user->value.MemberEnd() || !id->value.IsUint64()) { printf("retweet.id is not an int\n"); return false; }
|
2021-01-06 03:31:34 +08:00
|
|
|
result.push_back(id->value.GetUint64());
|
2021-01-05 07:22:35 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2021-01-06 03:41:07 +08:00
|
|
|
struct rapidjson : rapidjson_base {
|
2021-01-06 03:31:34 +08:00
|
|
|
bool run(simdjson::padded_string &json, std::vector<uint64_t> &result) {
|
|
|
|
return rapidjson_base::run(doc.Parse<kParseValidateEncodingFlag>(json.data()), result);
|
2021-01-05 12:20:24 +08:00
|
|
|
}
|
|
|
|
};
|
2021-01-06 02:45:49 +08:00
|
|
|
BENCHMARK_TEMPLATE(distinct_user_id, rapidjson)->UseManualTime();
|
2021-01-05 07:22:35 +08:00
|
|
|
|
2021-01-06 03:41:07 +08:00
|
|
|
struct rapidjson_insitu : rapidjson_base {
|
2021-01-06 03:31:34 +08:00
|
|
|
bool run(simdjson::padded_string &json, std::vector<uint64_t> &result) {
|
|
|
|
return rapidjson_base::run(doc.ParseInsitu<kParseValidateEncodingFlag>(json.data()), result);
|
2021-01-05 12:30:54 +08:00
|
|
|
}
|
|
|
|
};
|
2021-01-06 02:45:49 +08:00
|
|
|
BENCHMARK_TEMPLATE(distinct_user_id, rapidjson_insitu)->UseManualTime();
|
2021-01-05 12:30:54 +08:00
|
|
|
|
2021-01-05 07:22:35 +08:00
|
|
|
} // namespace partial_tweets
|
|
|
|
|
|
|
|
#endif // SIMDJSON_COMPETITION_RAPIDJSON
|