/* * Copyright (C) 2021 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include #include #include #include #include #include #include #include "Utils.h" #include "utils/DwarfSectionImplFake.h" #include "utils/MemoryFake.h" #include "utils/RegsFake.h" namespace unwindstack { namespace { // This collection of benchmarks exercises the DwarfSectionImpl::Eval function with a set of // artificial unwind data. The number of registers and register evaluation method are varied // for each individual benchmark. constexpr int kReturnAddressReg = 5; template class EvalBenchmark : public benchmark::Fixture { public: EvalBenchmark() { fake_memory_ = new MemoryFake; std::shared_ptr memory(fake_memory_); section_ = std::make_unique>(memory); } // Benchmarks DwarfSectionImpl::Eval given the DwarfLocation object, loc_regs, initialized in each // individual benchmark macro/function. // // This method initializes the fake register object and the DwarfCie object the same regardless // of the benchmark. So the initialization of loc_regs is carefully crafted in each benchmark // macro so that the evaluated PC and SP match the expected values after each call to Eval in the // benchmarking loop. // // In addition to the Eval call, register value assertion is included in the benchmarking loop // to ensure that we always capture the actual register evaluation // (DwarfSectionImpl::EvalRegister). For example, if Eval is modified to lazily evaluate register // values, we will still capture the register evaluation for the PC and SP (common case) in the // register value assertion. void RunBenchmark(benchmark::State& state, DwarfLocations& loc_regs) { DwarfCie cie{.return_address_register = kReturnAddressReg}; bool finished; RegsImplFake regs(64); regs.set_pc(0x1000); regs.set_sp(0x3500); regs[0] = 0x10000000; MemoryTracker mem_tracker; for (const auto& _ : state) { state.PauseTiming(); mem_tracker.StartTrackingAllocations(); state.ResumeTiming(); std::stringstream err_stream; if (!section_->Eval(&cie, fake_memory_, loc_regs, ®s, &finished)) { err_stream << "Eval() failed at address " << section_->LastErrorAddress(); state.SkipWithError(err_stream.str().c_str()); return; } if (finished || regs.pc() != 0x60000000U || regs.sp() != 0x10000000U) { err_stream << "Eval() finished successfully but registers were not evaluated correctly." << "\nExpected: finished == false, regs.pc() == 0x60000000, regs.sp() == 0x10000000." << "\nActual: finished == " << std::boolalpha << finished << std::hex << ", regs.pc() == 0x" << regs.pc() << ", regs.sp() == 0x" << regs.sp(); state.SkipWithError(err_stream.str().c_str()); return; } state.PauseTiming(); mem_tracker.StopTrackingAllocations(); state.ResumeTiming(); } mem_tracker.SetBenchmarkCounters(state); } protected: MemoryFake* fake_memory_; std::unique_ptr> section_; }; // Benchmarks exercising Eval with the DWARF_LOCATION_REGISTER evaluation method. BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_register_few_regs, uint64_t)(benchmark::State& state) { DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; loc_regs[kReturnAddressReg] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0x50000000}}; RunBenchmark(state, loc_regs); } BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_register_many_regs, uint64_t)(benchmark::State& state) { DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; for (uint64_t i = 0; i < 64; i++) { loc_regs[i] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, i * 0x10000000}}; } RunBenchmark(state, loc_regs); } // Benchmarks exercising Eval with the DWARF_LOCATION_VAL_OFFSET evaluation method. BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_val_offset_few_regs, uint64_t) (benchmark::State& state) { DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; loc_regs[kReturnAddressReg] = DwarfLocation{DWARF_LOCATION_VAL_OFFSET, {0x50000000, 0}}; RunBenchmark(state, loc_regs); } BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_val_offset_many_regs, uint64_t) (benchmark::State& state) { DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; for (uint64_t i = 0; i < 64; i++) { loc_regs[i] = DwarfLocation{DWARF_LOCATION_VAL_OFFSET, {i * 0x10000000, 0}}; } RunBenchmark(state, loc_regs); } // Benchmarks exercising Eval with the DWARF_LOCATION_OFFSET evaluation method. BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_offset_few_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetData64(0x20000000, 0x60000000); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; loc_regs[kReturnAddressReg] = DwarfLocation{DWARF_LOCATION_OFFSET, {0x10000000, 0}}; RunBenchmark(state, loc_regs); } BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_offset_many_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetData64(0x20000000, 0x60000000); fake_memory_->SetData64(0x30000000, 0x10000000); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; for (uint64_t i = 1; i < 64; i++) { loc_regs[i] = DwarfLocation{DWARF_LOCATION_OFFSET, {0x10000000, 0}}; } // Read from different place in memory for reg 0 so reg 0 maintains value of 0x10000000 // across multiple calls to Eval. loc_regs[0] = DwarfLocation{DWARF_LOCATION_OFFSET, {0x20000000, 0}}; RunBenchmark(state, loc_regs); } // Benchmarks exercising Eval with the DWARF_LOCATION_EXPRESSION evaluation method. // The dwarf op-code used for the expression benchmarks are OP_const4u (see DwarfOp::Eval). BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_expression_few_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetMemory(0x5000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x80}); uint64_t pc_value = 0x60000000; fake_memory_->SetMemory(0x80000000, &pc_value, sizeof(pc_value)); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; loc_regs[kReturnAddressReg] = DwarfLocation{DWARF_LOCATION_EXPRESSION, {0x4, 0x5004}}; RunBenchmark(state, loc_regs); } BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_expression_many_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetMemory(0x5000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x80}); uint64_t pc_value = 0x60000000; fake_memory_->SetMemory(0x80000000, &pc_value, sizeof(pc_value)); fake_memory_->SetMemory(0x6000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x90}); uint64_t sp_value = 0x10000000; fake_memory_->SetMemory(0x90000000, &sp_value, sizeof(sp_value)); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; for (uint64_t i = 1; i < 64; i++) { loc_regs[i] = DwarfLocation{DWARF_LOCATION_EXPRESSION, {0x4, 0x5004}}; } // Read from different place in memory for reg 0 so reg 0 maintains value of 0x10000000 // across multiple calls to Eval. loc_regs[0] = DwarfLocation{DWARF_LOCATION_EXPRESSION, {0x4, 0x6004}}; RunBenchmark(state, loc_regs); } // Benchmarks exercising Eval with the DWARF_LOCATION_VAL_EXPRESSION evaluation method. // The dwarf op-code used for the value expression benchmarks are OP_const4u (see DwarfOp::Eval). BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_val_expression_few_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetMemory(0x5000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x60}); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; loc_regs[kReturnAddressReg] = DwarfLocation{DWARF_LOCATION_VAL_EXPRESSION, {0x4, 0x5004}}; RunBenchmark(state, loc_regs); } BENCHMARK_TEMPLATE_F(EvalBenchmark, BM_eval_val_expression_many_regs, uint64_t) (benchmark::State& state) { fake_memory_->SetMemory(0x5000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x60}); fake_memory_->SetMemory(0x6000, std::vector{0x0c, 0x00, 0x00, 0x00, 0x10}); DwarfLocations loc_regs; loc_regs[CFA_REG] = DwarfLocation{DWARF_LOCATION_REGISTER, {0, 0}}; for (uint64_t i = 1; i < 64; i++) { loc_regs[i] = DwarfLocation{DWARF_LOCATION_VAL_EXPRESSION, {0x4, 0x5004}}; } // Read from different place in memory for reg 0 so reg 0 maintains value of 0x10000000 // across multiple calls to Eval. loc_regs[0] = DwarfLocation{DWARF_LOCATION_VAL_EXPRESSION, {0x4, 0x6004}}; RunBenchmark(state, loc_regs); } } // namespace } // namespace unwindstack