4e62055462
Benchmark added to test an optimization I'll send round next, test added when an even bigger refactoring (as part of a more interesting optimization) broke strtol() in a way the strtol() tests didn't notice. Test: treehugger Change-Id: Ic974900021107938dbbbe98648960adb102d9595
240 lines
7.1 KiB
C++
240 lines
7.1 KiB
C++
/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
#include <err.h>
|
|
#include <langinfo.h>
|
|
#include <locale.h>
|
|
#include <malloc.h>
|
|
#include <stdlib.h>
|
|
#include <unistd.h>
|
|
|
|
#include <benchmark/benchmark.h>
|
|
#include "ScopedDecayTimeRestorer.h"
|
|
#include "util.h"
|
|
|
|
// Shared body of the malloc/free benchmarks. Every iteration allocates
// state.range(0) bytes with malloc(), hands the allocation to
// MakeAllocationResident() (presumably so that its pages are really backed by
// memory -- see util.h) and then frees it again.
static void MallocFree(benchmark::State& state) {
  const size_t nbytes = state.range(0);
  const int page_size = getpagesize();

  for (auto _ : state) {
    void* allocation = malloc(nbytes);
    // Stop the compiler from treating the allocation as dead code.
    benchmark::DoNotOptimize(allocation);
    MakeAllocationResident(allocation, nbytes, page_size);
    free(allocation);
  }

  // One allocation of nbytes per iteration.
  state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(nbytes));
}
|
|
|
|
static void BM_stdlib_malloc_free_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
ScopedDecayTimeRestorer restorer;
|
|
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocFree(state);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_free_default, "AT_COMMON_SIZES");
|
|
|
|
#if defined(__BIONIC__)
// malloc()/free() round trips with the allocator decay time set to 1.
// Only built for bionic.
static void BM_stdlib_malloc_free_decay1(benchmark::State& state) {
  // Guard object created before the decay time is changed; presumably it puts
  // the previous setting back when this function returns.
  ScopedDecayTimeRestorer restorer;

  mallopt(M_DECAY_TIME, 1);

  MallocFree(state);
}
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_free_decay1, "AT_COMMON_SIZES");
#endif
|
|
|
|
// Shared body of the calloc/free benchmarks. Every iteration requests one
// element of state.range(0) bytes from calloc(), hands the allocation to
// MakeAllocationResident() (presumably so that its pages are really backed by
// memory -- see util.h) and then frees it again.
static void CallocFree(benchmark::State& state) {
  const size_t nbytes = state.range(0);
  const int page_size = getpagesize();

  for (auto _ : state) {
    void* allocation = calloc(1, nbytes);
    // Stop the compiler from treating the allocation as dead code.
    benchmark::DoNotOptimize(allocation);
    MakeAllocationResident(allocation, nbytes, page_size);
    free(allocation);
  }

  // One allocation of nbytes per iteration.
  state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(nbytes));
}
|
|
|
|
static void BM_stdlib_calloc_free_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
ScopedDecayTimeRestorer restorer;
|
|
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
CallocFree(state);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_calloc_free_default, "AT_COMMON_SIZES");
|
|
|
|
#if defined(__BIONIC__)
// calloc()/free() round trips with the allocator decay time set to 1.
// Only built for bionic.
static void BM_stdlib_calloc_free_decay1(benchmark::State& state) {
  // Use the same scoped guard as the other decay-time benchmarks in this file
  // rather than hard-coding a reset to 0 after the run. The guard presumably
  // restores whatever decay time was in effect before this benchmark started,
  // instead of assuming that value was 0.
  ScopedDecayTimeRestorer restorer;

  mallopt(M_DECAY_TIME, 1);

  CallocFree(state);
}
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_calloc_free_decay1, "AT_COMMON_SIZES");
#endif
|
|
|
|
// Shared body of the "many allocations" benchmarks. Every iteration performs
// numAllocs malloc(nbytes) calls, each followed by MakeAllocationResident()
// (presumably so that the pages are really backed by memory -- see util.h).
// The matching free() calls are made with the benchmark timer paused, so they
// are not part of the measured time.
static void MallocMultiple(benchmark::State& state, size_t nbytes, size_t numAllocs) {
  const int page_size = getpagesize();
  // Runtime-sized array (a compiler extension in C++) holding one iteration's
  // worth of allocations.
  void* allocations[numAllocs];

  for (auto _ : state) {
    for (size_t idx = 0; idx != numAllocs; ++idx) {
      allocations[idx] = malloc(nbytes);
      // Stop the compiler from treating the allocation as dead code.
      benchmark::DoNotOptimize(allocations[idx]);
      MakeAllocationResident(allocations[idx], nbytes, page_size);
    }

    // Releasing the memory is bookkeeping, not what is being measured.
    state.PauseTiming();
    for (size_t idx = 0; idx != numAllocs; ++idx) {
      free(allocations[idx]);
    }
    state.ResumeTiming();
  }

  // numAllocs allocations of nbytes per iteration.
  state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(nbytes) * numAllocs);
}
|
|
|
|
void BM_stdlib_malloc_forty_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
ScopedDecayTimeRestorer restorer;
|
|
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocMultiple(state, state.range(0), 40);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_forty_default, "AT_COMMON_SIZES");
|
|
|
|
#if defined(__BIONIC__)
// Forty allocations of state.range(0) bytes per iteration, with the allocator
// decay time set to 1. Only built for bionic.
void BM_stdlib_malloc_forty_decay1(benchmark::State& state) {
  // Guard object created before the decay time is changed; presumably it puts
  // the previous setting back when this function returns.
  ScopedDecayTimeRestorer restorer;

  mallopt(M_DECAY_TIME, 1);

  const size_t alloc_count = 40;
  MallocMultiple(state, state.range(0), alloc_count);
}
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_forty_decay1, "AT_COMMON_SIZES");
#endif
|
|
|
|
void BM_stdlib_malloc_multiple_8192_allocs_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
ScopedDecayTimeRestorer restorer;
|
|
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocMultiple(state, 8192, state.range(0));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_multiple_8192_allocs_default, "AT_SMALL_SIZES");
|
|
|
|
#if defined(__BIONIC__)
// state.range(0) allocations of 8192 bytes each per iteration, with the
// allocator decay time set to 1. Only built for bionic.
void BM_stdlib_malloc_multiple_8192_allocs_decay1(benchmark::State& state) {
  // Guard object created before the decay time is changed; presumably it puts
  // the previous setting back when this function returns.
  ScopedDecayTimeRestorer restorer;

  mallopt(M_DECAY_TIME, 1);

  const size_t alloc_size = 8192;
  MallocMultiple(state, alloc_size, state.range(0));
}
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_multiple_8192_allocs_decay1, "AT_SMALL_SIZES");
#endif
|
|
|
|
static void BM_stdlib_mbstowcs_ascii(benchmark::State& state) {
|
|
// It doesn't really matter what ASCII character we pick.
|
|
// The flow through the fast path is the same regardless.
|
|
const size_t count = 500000;
|
|
std::vector<char> mbs(count, 'e');
|
|
std::vector<wchar_t> wcs(count);
|
|
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbstowcs(&wcs[0], &mbs[0], wcs.size()));
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(wcs.size()));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbstowcs_ascii, "");
|
|
|
|
static void BM_stdlib_mbstowcs_wide(benchmark::State& state) {
|
|
// It doesn't matter much what wide character we pick.
|
|
// A three-byte character seems pretty representative, and all three byte
|
|
// characters are the same from the code's perspective.
|
|
const size_t count = 500000;
|
|
std::string mbs;
|
|
for (size_t i = 0; i < count; i++) {
|
|
mbs += "\xe5\xb1\xb1";
|
|
}
|
|
std::vector<wchar_t> wcs(count);
|
|
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbstowcs(&wcs[0], &mbs[0], wcs.size()));
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(wcs.size()));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbstowcs_wide, "");
|
|
|
|
static void BM_stdlib_mbrtowc_1(benchmark::State& state) {
|
|
wchar_t wc;
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbrtowc(&wc, "e", 1, nullptr));
|
|
}
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbrtowc_1, "");
|
|
|
|
static void BM_stdlib_mbrtowc_2(benchmark::State& state) {
|
|
wchar_t wc;
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbrtowc(&wc, "\xc3\x9f", 3, nullptr));
|
|
}
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbrtowc_2, "");
|
|
|
|
static void BM_stdlib_mbrtowc_3(benchmark::State& state) {
|
|
wchar_t wc;
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbrtowc(&wc, "\xe5\xb1\xb1", 3, nullptr));
|
|
}
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbrtowc_3, "");
|
|
|
|
static void BM_stdlib_mbrtowc_4(benchmark::State& state) {
|
|
wchar_t wc;
|
|
for (auto _ : state) {
|
|
benchmark::DoNotOptimize(mbrtowc(&wc, "\xf0\xa4\xad\xa2", 4, nullptr));
|
|
}
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbrtowc_4, "");
|
|
|
|
// Decimal input: every conversion function is given the same string, which
// starts with a space and a minus sign.
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_atoi, atoi(" -123"));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_atol, atol(" -123"));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtol, strtol(" -123", nullptr, 0));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoll, strtoll(" -123", nullptr, 0));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoul, strtoul(" -123", nullptr, 0));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoull, strtoull(" -123", nullptr, 0));

// "0x"-prefixed input parsed with base 0, so the base is taken from the prefix.
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtol_hex, strtol("0xdeadbeef", nullptr, 0));
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoul_hex, strtoul("0xdeadbeef", nullptr, 0));
|