96705e3712
Many of our benchmarks are basically just "call one function with a fixed argument". We don't need to keep repeating all the boilerplate for that. This also ensures we don't forget the benchmark::DoNotOptimize, which -- in addition to being a good idea in general -- specifically solves the problem with gettid benchmark and provides a more accurate result by removing the indirection through a function pointer. Test: ran benchmarks Change-Id: Id67535243678cd0d48f51cf25141e2040da9af03
224 lines
6.7 KiB
C++
224 lines
6.7 KiB
C++
/*
|
|
* Copyright (C) 2017 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include <err.h>
|
|
#include <langinfo.h>
|
|
#include <locale.h>
|
|
#include <malloc.h>
|
|
#include <stdlib.h>
|
|
#include <unistd.h>
|
|
|
|
#include <benchmark/benchmark.h>
|
|
#include "util.h"
|
|
|
|
#if defined(__BIONIC__)
|
|
|
|
#else
|
|
#endif
|
|
|
|
static __always_inline void MakeAllocationResident(void* ptr, size_t nbytes, int pagesize) {
|
|
uint8_t* data = reinterpret_cast<uint8_t*>(ptr);
|
|
for (size_t i = 0; i < nbytes; i += pagesize) {
|
|
data[i] = 1;
|
|
}
|
|
}
|
|
|
|
static void MallocFree(benchmark::State& state) {
|
|
const size_t nbytes = state.range(0);
|
|
int pagesize = getpagesize();
|
|
|
|
for (auto _ : state) {
|
|
void* ptr;
|
|
benchmark::DoNotOptimize(ptr = malloc(nbytes));
|
|
MakeAllocationResident(ptr, nbytes, pagesize);
|
|
free(ptr);
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(nbytes));
|
|
}
|
|
|
|
static void BM_stdlib_malloc_free_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocFree(state);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_free_default, "AT_COMMON_SIZES");
|
|
|
|
#if defined(__BIONIC__)
|
|
static void BM_stdlib_malloc_free_decay1(benchmark::State& state) {
|
|
mallopt(M_DECAY_TIME, 1);
|
|
|
|
MallocFree(state);
|
|
|
|
mallopt(M_DECAY_TIME, 0);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_free_decay1, "AT_COMMON_SIZES");
|
|
#endif
|
|
|
|
static void MallocMultiple(benchmark::State& state, size_t nbytes, size_t numAllocs) {
|
|
int pagesize = getpagesize();
|
|
void* ptrs[numAllocs];
|
|
for (auto _ : state) {
|
|
for (size_t i = 0; i < numAllocs; i++) {
|
|
benchmark::DoNotOptimize(ptrs[i] = reinterpret_cast<uint8_t*>(malloc(nbytes)));
|
|
MakeAllocationResident(ptrs[i], nbytes, pagesize);
|
|
}
|
|
state.PauseTiming(); // Stop timers while freeing pointers.
|
|
for (size_t i = 0; i < numAllocs; i++) {
|
|
free(ptrs[i]);
|
|
}
|
|
state.ResumeTiming();
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(nbytes) * numAllocs);
|
|
}
|
|
|
|
void BM_stdlib_malloc_forty_default(benchmark::State& state) {
|
|
|
|
#if defined(__BIONIC__)
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocMultiple(state, state.range(0), 40);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_forty_default, "AT_COMMON_SIZES");
|
|
|
|
#if defined(__BIONIC__)
|
|
void BM_stdlib_malloc_forty_decay1(benchmark::State& state) {
|
|
mallopt(M_DECAY_TIME, 1);
|
|
|
|
MallocMultiple(state, state.range(0), 40);
|
|
|
|
mallopt(M_DECAY_TIME, 0);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_forty_decay1, "AT_COMMON_SIZES");
|
|
#endif
|
|
|
|
void BM_stdlib_malloc_multiple_8192_allocs_default(benchmark::State& state) {
|
|
#if defined(__BIONIC__)
|
|
// The default is expected to be a zero decay time.
|
|
mallopt(M_DECAY_TIME, 0);
|
|
#endif
|
|
|
|
MallocMultiple(state, 8192, state.range(0));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_multiple_8192_allocs_default, "AT_SMALL_SIZES");
|
|
|
|
#if defined(__BIONIC__)
|
|
void BM_stdlib_malloc_multiple_8192_allocs_decay1(benchmark::State& state) {
|
|
mallopt(M_DECAY_TIME, 1);
|
|
|
|
MallocMultiple(state, 8192, state.range(0));
|
|
|
|
mallopt(M_DECAY_TIME, 0);
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_malloc_multiple_8192_allocs_decay1, "AT_SMALL_SIZES");
|
|
#endif
|
|
|
|
static void BM_stdlib_mbstowcs(benchmark::State& state) {
|
|
const size_t buf_alignment = state.range(0);
|
|
const size_t widebuf_alignment = state.range(1);
|
|
|
|
std::vector<char> buf;
|
|
std::vector<wchar_t> widebuf;
|
|
|
|
setlocale(LC_CTYPE, "C.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en_US.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en_GB.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en.UTF-8")
|
|
|| setlocale(LC_CTYPE, "de_DE-8")
|
|
|| setlocale(LC_CTYPE, "fr_FR-8");
|
|
if (strcmp(nl_langinfo(CODESET), "UTF-8")) {
|
|
errx(1, "ERROR: unable to set locale in BM_stdlib_mbstowcs");
|
|
}
|
|
|
|
char* buf_aligned = GetAlignedPtr(&buf, buf_alignment, 500000);
|
|
wchar_t* widebuf_aligned = GetAlignedPtr(&widebuf, widebuf_alignment, 500000);
|
|
size_t i, j, k, l;
|
|
l = 0;
|
|
for (i=0xc3; i<0xe0; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
buf[l++] = i, buf[l++] = j;
|
|
for (i=0xe1; i<0xed; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
for (k=0x80; k<0xc0; k++)
|
|
buf[l++] = i, buf[l++] = j, buf[l++] = k;
|
|
for (i=0xf1; i<0xf4; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
for (k=0x80; k<0xc0; k++)
|
|
buf[l++] = i, buf[l++] = j, buf[l++] = 0x80, buf[l++] = k;
|
|
buf[l++] = 0;
|
|
|
|
volatile size_t c __attribute__((unused)) = 0;
|
|
for (auto _ : state) {
|
|
c = mbstowcs(widebuf_aligned, buf_aligned, 500000);
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(500000));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbstowcs, "0 0");
|
|
|
|
static void BM_stdlib_mbrtowc(benchmark::State& state) {
|
|
const size_t buf_alignment = state.range(0);
|
|
|
|
std::vector<char> buf;
|
|
|
|
setlocale(LC_CTYPE, "C.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en_US.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en_GB.UTF-8")
|
|
|| setlocale(LC_CTYPE, "en.UTF-8")
|
|
|| setlocale(LC_CTYPE, "de_DE-8")
|
|
|| setlocale(LC_CTYPE, "fr_FR-8");
|
|
if (strcmp(nl_langinfo(CODESET), "UTF-8")) {
|
|
errx(1, "ERROR: unable to set locale in BM_stdlib_mbrtowc");
|
|
}
|
|
|
|
char* buf_aligned = GetAlignedPtr(&buf, buf_alignment, 500000);
|
|
size_t i, j, k, l;
|
|
l = 0;
|
|
for (i=0xc3; i<0xe0; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
buf[l++] = i, buf[l++] = j;
|
|
for (i=0xe1; i<0xed; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
for (k=0x80; k<0xc0; k++)
|
|
buf[l++] = i, buf[l++] = j, buf[l++] = k;
|
|
for (i=0xf1; i<0xf4; i++)
|
|
for (j=0x80; j<0xc0; j++)
|
|
for (k=0x80; k<0xc0; k++)
|
|
buf[l++] = i, buf[l++] = j, buf[l++] = 0x80, buf[l++] = k;
|
|
buf[l++] = 0;
|
|
|
|
wchar_t wc = 0;
|
|
for (auto _ : state) {
|
|
for (j = 0; buf_aligned[j]; j+=mbrtowc(&wc, buf_aligned + j, 4, nullptr)) {
|
|
}
|
|
}
|
|
|
|
state.SetBytesProcessed(uint64_t(state.iterations()) * uint64_t(500000));
|
|
}
|
|
BIONIC_BENCHMARK_WITH_ARG(BM_stdlib_mbrtowc, "0");
|
|
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_atoi, atoi(" -123"));
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_atol, atol(" -123"));
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtol, strtol(" -123", nullptr, 0));
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoll, strtoll(" -123", nullptr, 0));
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoul, strtoul(" -123", nullptr, 0));
|
|
BIONIC_TRIVIAL_BENCHMARK(BM_stdlib_strtoull, strtoull(" -123", nullptr, 0));
|