// Protocol Buffers - Google's data interchange format // Copyright 2023 Google LLC. All rights reserved. // // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file or at // https://developers.google.com/open-source/licenses/bsd #include #include #include #include #include #include #include "google/ads/googleads/v17/services/google_ads_service.upbdefs.h" #include "google/protobuf/descriptor.pb.h" #include "absl/container/flat_hash_set.h" #include "absl/log/absl_check.h" #include "google/protobuf/dynamic_message.h" #include "google/protobuf/json/json.h" #include "benchmarks/descriptor.pb.h" #include "benchmarks/descriptor.upb.h" #include "benchmarks/descriptor.upb_minitable.h" #include "benchmarks/descriptor.upbdefs.h" #include "benchmarks/descriptor_sv.pb.h" #include "upb/base/string_view.h" #include "upb/base/upcast.h" #include "upb/json/decode.h" #include "upb/json/encode.h" #include "upb/mem/arena.h" #include "upb/reflection/def.hpp" #include "upb/reflection/internal/def_pool.h" #include "upb/wire/decode.h" upb_StringView descriptor = benchmarks_descriptor_proto_upbdefinit.descriptor; namespace protobuf = ::google::protobuf; // A buffer big enough to parse descriptor.proto without going to heap. // We use 64-bit ints here to force alignment. int64_t buf[8191]; void CollectFileDescriptors( const _upb_DefPool_Init* file, std::vector& serialized_files, absl::flat_hash_set& seen) { if (!seen.insert(file).second) return; for (_upb_DefPool_Init** deps = file->deps; *deps; deps++) { CollectFileDescriptors(*deps, serialized_files, seen); } serialized_files.push_back(file->descriptor); } static void BM_ArenaOneAlloc(benchmark::State& state) { for (auto _ : state) { upb_Arena* arena = upb_Arena_New(); upb_Arena_Malloc(arena, 1); upb_Arena_Free(arena); } } BENCHMARK(BM_ArenaOneAlloc); static void BM_ArenaInitialBlockOneAlloc(benchmark::State& state) { for (auto _ : state) { upb_Arena* arena = upb_Arena_Init(buf, sizeof(buf), nullptr); upb_Arena_Malloc(arena, 1); upb_Arena_Free(arena); } } BENCHMARK(BM_ArenaInitialBlockOneAlloc); static void BM_ArenaFuseUnbalanced(benchmark::State& state) { std::vector arenas(state.range(0)); size_t n = 0; for (auto _ : state) { for (auto& arena : arenas) { arena = upb_Arena_New(); } for (auto& arena : arenas) { upb_Arena_Fuse(arenas[0], arena); } for (auto& arena : arenas) { upb_Arena_Free(arena); } n += arenas.size(); } state.SetItemsProcessed(n); } BENCHMARK(BM_ArenaFuseUnbalanced)->Range(2, 128); static void BM_ArenaFuseBalanced(benchmark::State& state) { std::vector arenas(state.range(0)); size_t n = 0; for (auto _ : state) { for (auto& arena : arenas) { arena = upb_Arena_New(); } // Perform a series of fuses that keeps the halves balanced. const size_t max = ceil(log2(double(arenas.size()))); for (size_t n = 0; n <= max; n++) { size_t step = 1 << n; for (size_t i = 0; i + step < arenas.size(); i += (step * 2)) { upb_Arena_Fuse(arenas[i], arenas[i + step]); } } for (auto& arena : arenas) { upb_Arena_Free(arena); } n += arenas.size(); } state.SetItemsProcessed(n); } BENCHMARK(BM_ArenaFuseBalanced)->Range(2, 128); enum LoadDescriptorMode { NoLayout, WithLayout, }; template static void BM_LoadAdsDescriptor_Upb(benchmark::State& state) { size_t bytes_per_iter = 0; for (auto _ : state) { upb::DefPool defpool; if (Mode == NoLayout) { google_ads_googleads_v17_services_SearchGoogleAdsRequest_getmsgdef( defpool.ptr()); } else { _upb_DefPool_LoadDefInitEx( defpool.ptr(), &google_ads_googleads_v17_services_google_ads_service_proto_upbdefinit, true); } bytes_per_iter = _upb_DefPool_BytesLoaded(defpool.ptr()); benchmark::DoNotOptimize(defpool); } state.SetBytesProcessed(state.iterations() * bytes_per_iter); } BENCHMARK_TEMPLATE(BM_LoadAdsDescriptor_Upb, NoLayout); BENCHMARK_TEMPLATE(BM_LoadAdsDescriptor_Upb, WithLayout); template static void BM_LoadAdsDescriptor_Proto2(benchmark::State& state) { extern _upb_DefPool_Init google_ads_googleads_v17_services_google_ads_service_proto_upbdefinit; std::vector serialized_files; absl::flat_hash_set seen_files; CollectFileDescriptors( &google_ads_googleads_v17_services_google_ads_service_proto_upbdefinit, serialized_files, seen_files); size_t bytes_per_iter = 0; for (auto _ : state) { bytes_per_iter = 0; protobuf::Arena arena; protobuf::DescriptorPool pool; for (auto file : serialized_files) { absl::string_view input(file.data, file.size); auto proto = protobuf::Arena::Create(&arena); bool ok = proto->ParseFrom(input) && pool.BuildFile(*proto) != nullptr; if (!ok) { printf("Failed to add file.\n"); exit(1); } bytes_per_iter += input.size(); benchmark::DoNotOptimize(proto); } if (Mode == WithLayout) { protobuf::DynamicMessageFactory factory; const protobuf::Descriptor* d = pool.FindMessageTypeByName( "google.ads.googleads.v17.services.SearchGoogleAdsResponse"); if (!d) { printf("Failed to find descriptor.\n"); exit(1); } (void)factory.GetPrototype(d); } } state.SetBytesProcessed(state.iterations() * bytes_per_iter); } BENCHMARK_TEMPLATE(BM_LoadAdsDescriptor_Proto2, NoLayout); BENCHMARK_TEMPLATE(BM_LoadAdsDescriptor_Proto2, WithLayout); enum CopyStrings { Copy, Alias, }; enum ArenaMode { NoArena, UseArena, InitBlock, }; enum MinitableMode { CompiledIn, Parsed, }; /* Minor changes in code can result in changes to binary layout of the compiled in minitables. Benchmarking against both the compiled-in representation and the runtime parsed representation laid out in an arena can identify a performance improvement or regression is due to the actual change or due to unrelated binary layout changes. */ const upb_MiniTable* GetFileDescriptorMiniTable(MinitableMode mode, upb::DefPool* defpool) { if (mode == CompiledIn) { return &upb_0benchmark__FileDescriptorProto_msg_init; } else { _upb_DefPool_LoadDefInitEx( defpool->ptr(), &benchmarks_descriptor_proto_upbdefinit, true); const upb_MessageDef* m = upb_DefPool_FindMessageByName( defpool->ptr(), "upb_benchmark.FileDescriptorProto"); if (!m) { fprintf(stderr, "Failed to find message definition.\n"); exit(1); } return upb_MessageDef_MiniTable(m); } } template static void BM_Parse_Upb_FileDesc(benchmark::State& state) { upb::DefPool defpool; const upb_MiniTable* mt = GetFileDescriptorMiniTable(MMode, &defpool); for (auto _ : state) { upb_Arena* arena; if (AMode == InitBlock) { arena = upb_Arena_Init(buf, sizeof(buf), nullptr); } else { arena = upb_Arena_New(); } upb_Message* set = upb_Message_New(mt, arena); upb_DecodeStatus status = upb_Decode(descriptor.data, descriptor.size, set, mt, nullptr, Copy == Alias ? kUpb_DecodeOption_AliasString : 0, arena); if (status != kUpb_DecodeStatus_Ok) { printf("Failed to parse with status %d.\n", status); exit(1); } benchmark::DoNotOptimize(set); upb_Arena_Free(arena); } state.SetBytesProcessed(state.iterations() * descriptor.size); } BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, CompiledIn, UseArena, Copy); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, CompiledIn, UseArena, Alias); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, CompiledIn, InitBlock, Copy); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, CompiledIn, InitBlock, Alias); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, Parsed, UseArena, Copy); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, Parsed, UseArena, Alias); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, Parsed, InitBlock, Copy); BENCHMARK_TEMPLATE(BM_Parse_Upb_FileDesc, Parsed, InitBlock, Alias); template struct Proto2Factory; template struct Proto2Factory { public: P* GetProto() { return &proto; } private: P proto; }; template struct Proto2Factory { public: P* GetProto() { return protobuf::Arena::Create

(&arena); } private: protobuf::Arena arena; }; template struct Proto2Factory { public: Proto2Factory() : arena(GetOptions()) {} P* GetProto() { return protobuf::Arena::Create

(&arena); } private: protobuf::ArenaOptions GetOptions() { protobuf::ArenaOptions opts; opts.initial_block = (char*)buf; opts.initial_block_size = sizeof(buf); return opts; } protobuf::Arena arena; }; using FileDesc = ::upb_benchmark::FileDescriptorProto; using FileDescSV = ::upb_benchmark::sv::FileDescriptorProto; template void BM_Parse_Proto2(benchmark::State& state) { constexpr protobuf::MessageLite::ParseFlags kParseFlags = kCopy == Copy ? protobuf::MessageLite::ParseFlags::kMergePartial : protobuf::MessageLite::ParseFlags::kMergePartialWithAliasing; for (auto _ : state) { Proto2Factory proto_factory; auto proto = proto_factory.GetProto(); absl::string_view input(descriptor.data, descriptor.size); bool ok = proto->template ParseFrom(input); if (!ok) { printf("Failed to parse.\n"); exit(1); } benchmark::DoNotOptimize(proto); } state.SetBytesProcessed(state.iterations() * descriptor.size); } BENCHMARK_TEMPLATE(BM_Parse_Proto2, FileDesc, NoArena, Copy); BENCHMARK_TEMPLATE(BM_Parse_Proto2, FileDesc, UseArena, Copy); BENCHMARK_TEMPLATE(BM_Parse_Proto2, FileDesc, InitBlock, Copy); BENCHMARK_TEMPLATE(BM_Parse_Proto2, FileDescSV, InitBlock, Alias); static void BM_SerializeDescriptor_Proto2(benchmark::State& state) { upb_benchmark::FileDescriptorProto proto; (void)proto.ParseFromString( absl::string_view(descriptor.data, descriptor.size)); for (auto _ : state) { (void)proto.SerializePartialToArray(buf, sizeof(buf)); benchmark::DoNotOptimize(buf); } state.SetBytesProcessed(state.iterations() * descriptor.size); } BENCHMARK(BM_SerializeDescriptor_Proto2); template static void BM_SerializeDescriptor_Upb(benchmark::State& state) { upb::DefPool defpool; const upb_MiniTable* mt = GetFileDescriptorMiniTable(MMode, &defpool); upb_Arena* arena = upb_Arena_New(); upb_Message* set = upb_Message_New(mt, arena); upb_DecodeStatus status = upb_Decode(descriptor.data, descriptor.size, set, mt, nullptr, 0, arena); if (status != kUpb_DecodeStatus_Ok) { printf("Failed to parse.\n"); exit(1); } int64_t total = 0; for (auto _ : state) { upb_Arena* enc_arena; if (AMode == InitBlock) { enc_arena = upb_Arena_Init(buf, sizeof(buf), nullptr); } else { enc_arena = upb_Arena_New(); } size_t size; char* data; upb_EncodeStatus encode_status = upb_Encode(set, mt, 0, enc_arena, &data, &size); if (encode_status != kUpb_EncodeStatus_Ok) { printf("Failed to serialize.\n"); exit(1); } total += size; benchmark::DoNotOptimize(data); upb_Arena_Free(enc_arena); } state.SetBytesProcessed(total); upb_Arena_Free(arena); } BENCHMARK_TEMPLATE(BM_SerializeDescriptor_Upb, CompiledIn, UseArena); BENCHMARK_TEMPLATE(BM_SerializeDescriptor_Upb, CompiledIn, InitBlock); BENCHMARK_TEMPLATE(BM_SerializeDescriptor_Upb, Parsed, UseArena); BENCHMARK_TEMPLATE(BM_SerializeDescriptor_Upb, Parsed, InitBlock); static absl::string_view UpbJsonEncode(upb_benchmark_FileDescriptorProto* proto, const upb_MessageDef* md, upb_Arena* arena) { size_t size = upb_JsonEncode(UPB_UPCAST(proto), md, nullptr, 0, nullptr, 0, nullptr); char* buf = reinterpret_cast(upb_Arena_Malloc(arena, size + 1)); upb_JsonEncode(UPB_UPCAST(proto), md, nullptr, 0, buf, size, nullptr); return absl::string_view(buf, size); } static void BM_JsonParse_Upb(benchmark::State& state) { upb_Arena* arena = upb_Arena_New(); upb_benchmark_FileDescriptorProto* set = upb_benchmark_FileDescriptorProto_parse(descriptor.data, descriptor.size, arena); if (!set) { printf("Failed to parse.\n"); exit(1); } upb::DefPool defpool; const upb_MessageDef* md = upb_benchmark_FileDescriptorProto_getmsgdef(defpool.ptr()); auto json = UpbJsonEncode(set, md, arena); for (auto _ : state) { upb_Arena* arena = upb_Arena_New(); upb_benchmark_FileDescriptorProto* proto = upb_benchmark_FileDescriptorProto_new(arena); upb_JsonDecode(json.data(), json.size(), UPB_UPCAST(proto), md, defpool.ptr(), 0, arena, nullptr); benchmark::DoNotOptimize(proto); upb_Arena_Free(arena); } state.SetBytesProcessed(state.iterations() * json.size()); } BENCHMARK(BM_JsonParse_Upb); static void BM_JsonParse_Proto2(benchmark::State& state) { protobuf::FileDescriptorProto proto; absl::string_view input(descriptor.data, descriptor.size); (void)proto.ParseFromString(input); std::string json; ABSL_CHECK_OK(google::protobuf::json::MessageToJsonString(proto, &json)); for (auto _ : state) { protobuf::FileDescriptorProto proto; ABSL_CHECK_OK(google::protobuf::json::JsonStringToMessage(json, &proto)); benchmark::DoNotOptimize(proto); } state.SetBytesProcessed(state.iterations() * json.size()); } BENCHMARK(BM_JsonParse_Proto2); static void BM_JsonSerialize_Upb(benchmark::State& state) { upb_Arena* arena = upb_Arena_New(); upb_benchmark_FileDescriptorProto* set = upb_benchmark_FileDescriptorProto_parse(descriptor.data, descriptor.size, arena); ABSL_CHECK(set != nullptr); upb::DefPool defpool; const upb_MessageDef* md = upb_benchmark_FileDescriptorProto_getmsgdef(defpool.ptr()); auto json = UpbJsonEncode(set, md, arena); std::string json_str; json_str.resize(json.size()); for (auto _ : state) { // This isn't a fully fair comparison, as it assumes we already know the // correct size of the buffer. In practice, we usually need to run the // encoder twice, once to discover the size of the buffer. upb_JsonEncode(UPB_UPCAST(set), md, nullptr, 0, json_str.data(), json_str.size(), nullptr); benchmark::DoNotOptimize(json_str); } state.SetBytesProcessed(state.iterations() * json.size()); } BENCHMARK(BM_JsonSerialize_Upb); static void BM_JsonSerialize_Proto2(benchmark::State& state) { protobuf::FileDescriptorProto proto; absl::string_view input(descriptor.data, descriptor.size); (void)proto.ParseFromString(input); std::string json; for (auto _ : state) { json.clear(); ABSL_CHECK_OK(google::protobuf::json::MessageToJsonString(proto, &json)); benchmark::DoNotOptimize(json); } state.SetBytesProcessed(state.iterations() * json.size()); } BENCHMARK(BM_JsonSerialize_Proto2);