// blob: fb7beb5a386796932e559307f4ed969858dc67f8 [file] [log] [blame]
// Copyright 2020 The Marl Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "marl_bench.h"
#include "marl/waitgroup.h"
#include "benchmark/benchmark.h"
// Benchmark "Empty": on every benchmark iteration, hands `numTasks` no-op
// tasks to marl::schedule(). Nothing in this body waits for those tasks, so
// only the act of scheduling sits inside the timed loop.
BENCHMARK_DEFINE_F(Schedule, Empty)(benchmark::State& state) {
  const auto scheduleNoOps = [&](int numTasks) {
    for (auto _ : state) {
      int taskIndex = 0;
      while (taskIndex < numTasks) {
        marl::schedule([] {});
        ++taskIndex;
      }
    }
  };
  run(state, scheduleNoOps);
}
// Register the benchmark; the argument sets are supplied by Schedule::args.
BENCHMARK_REGISTER_F(Schedule, Empty)->Apply(Schedule::args);
// Benchmark "SomeWork": on every benchmark iteration, schedules `numTasks`
// tasks that each call doSomeWork() with their own index, then blocks on a
// wait group until every task has reported completion.
BENCHMARK_DEFINE_F(Schedule, SomeWork)(benchmark::State& state) {
  run(state, [&](int numTasks) {
    for (auto _ : state) {
      // Register all tasks up front so wait() cannot return early.
      marl::WaitGroup pending;
      pending.add(numTasks);

      for (int taskIndex = 0; taskIndex < numTasks; ++taskIndex) {
        // The wait group and the index are both captured by copy.
        marl::schedule([pending, taskIndex] {
          uint32_t result = doSomeWork(taskIndex);
          // Keep the compiler from discarding the computation.
          benchmark::DoNotOptimize(result);
          pending.done();
        });
      }

      pending.wait();
    }
  });
}
// Register the benchmark; the argument sets are supplied by Schedule::args.
BENCHMARK_REGISTER_F(Schedule, SomeWork)->Apply(Schedule::args);
// Benchmark "MultipleForkAndJoin": schedules `numTasks` heavier tasks per
// benchmark iteration, joining on the wait group after every batch of
// `tasksPerBatch` tasks and once more at the end of the iteration.
BENCHMARK_DEFINE_F(Schedule, MultipleForkAndJoin)(benchmark::State& state) {
  run(state, [&](int numTasks) {
    // One batch is as many tasks as Schedule::numThreads() reports, but never
    // fewer than one (this also keeps the modulo below well-defined).
    const int tasksPerBatch = std::max(1, Schedule::numThreads(state));

    for (auto _ : state) {
      marl::WaitGroup pending;

      for (int taskIndex = 0; taskIndex < numTasks; ++taskIndex) {
        pending.add(1);
        marl::schedule([pending, taskIndex] {
          // Each task is made deliberately expensive so that running tasks
          // concurrently matters: a worker that ends up executing more than
          // one task of a batch will show up in the measured time.
          int accumulator = taskIndex;
          for (int round = 0; round != 256; ++round) {
            accumulator = doSomeWork(accumulator);
          }
          benchmark::DoNotOptimize(accumulator);
          pending.done();
        });

        // Join once a full batch has been forked; this is the fork-and-join
        // pattern the benchmark is modelling.
        const bool batchComplete = ((taskIndex + 1) % tasksPerBatch) == 0;
        if (batchComplete) {
          pending.wait();
        }
      }

      // Join whatever is left from a final, partially filled batch.
      pending.wait();
    }
  });
}
// Register the benchmark with the Schedule::args<512> argument generator.
BENCHMARK_REGISTER_F(Schedule, MultipleForkAndJoin)->Apply(Schedule::args<512>);
// Benchmark "SomeWorkWorkerAffinityOneOf": the same workload as the SomeWork
// benchmark (schedule `numTasks` doSomeWork() tasks, then wait for all of
// them), but run with a scheduler config whose worker thread affinity policy
// is Policy::oneOf() built from Thread::Affinity::all().
BENCHMARK_DEFINE_F(Schedule, SomeWorkWorkerAffinityOneOf)(benchmark::State& state) {
  marl::Scheduler::Config config;
  config.setWorkerThreadAffinityPolicy(
      marl::Thread::Affinity::Policy::oneOf(marl::Thread::Affinity::all()));

  run(state, config, [&](int numTasks) {
    for (auto _ : state) {
      // Register all tasks up front so wait() cannot return early.
      marl::WaitGroup pending;
      pending.add(numTasks);

      for (int taskIndex = 0; taskIndex < numTasks; ++taskIndex) {
        // The wait group and the index are both captured by copy.
        marl::schedule([pending, taskIndex] {
          uint32_t result = doSomeWork(taskIndex);
          // Keep the compiler from discarding the computation.
          benchmark::DoNotOptimize(result);
          pending.done();
        });
      }

      pending.wait();
    }
  });
}
// Register the benchmark; the argument sets are supplied by Schedule::args.
BENCHMARK_REGISTER_F(Schedule, SomeWorkWorkerAffinityOneOf)
    ->Apply(Schedule::args);