123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238 |
- /*
- * Copyright 2018-present Facebook, Inc.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- #include <thread>
- #include <folly/synchronization/ParkingLot.h>
- #include <folly/Benchmark.h>
- #include <folly/detail/Futex.h>
- #include <folly/synchronization/Baton.h>
- #include <folly/synchronization/test/Barrier.h>
- DEFINE_uint64(threads, 32, "Number of threads for benchmark");
- using namespace folly;
- using namespace folly::test;
- ParkingLot<> lot;
- BENCHMARK(FutexNoWaitersWake, iters) {
- BenchmarkSuspender susp;
- folly::detail::Futex<> fu;
- Barrier b(FLAGS_threads + 1);
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- detail::futexWake(&fu, 1);
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto& t : threads) {
- t.join();
- }
- }
- BENCHMARK_RELATIVE(ParkingLotNoWaitersWake, iters) {
- BenchmarkSuspender susp;
- Barrier b(FLAGS_threads + 1);
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- lot.unpark(&lot, [](Unit) { return UnparkControl::RetainContinue; });
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto& t : threads) {
- t.join();
- }
- }
- BENCHMARK(FutexWakeOne, iters) {
- BenchmarkSuspender susp;
- folly::detail::Futex<> fu;
- Barrier b(FLAGS_threads + 1);
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- while (true) {
- detail::futexWait(&fu, 0);
- if (fu.load(std::memory_order_relaxed)) {
- return;
- }
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- detail::futexWake(&fu, 1);
- }
- fu.store(1);
- detail::futexWake(&fu, threads.size());
- for (auto& t : threads) {
- t.join();
- }
- }
- BENCHMARK_RELATIVE(ParkingLotWakeOne, iters) {
- BenchmarkSuspender susp;
- std::atomic<bool> done{false};
- Barrier b(FLAGS_threads + 1);
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- while (true) {
- Unit f;
- lot.park(
- &done,
- f,
- [&] { return done.load(std::memory_order_relaxed) == 0; },
- [] {});
- if (done.load(std::memory_order_relaxed)) {
- return;
- }
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- lot.unpark(&done, [](Unit) { return UnparkControl::RemoveBreak; });
- }
- done = true;
- lot.unpark(&done, [](Unit) { return UnparkControl::RemoveContinue; });
- for (auto& t : threads) {
- t.join();
- }
- }
- BENCHMARK(FutexWakeAll, iters) {
- BenchmarkSuspender susp;
- Barrier b(FLAGS_threads + 1);
- folly::detail::Futex<> fu;
- std::atomic<bool> done{false};
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- while (true) {
- detail::futexWait(&fu, 0);
- if (done.load(std::memory_order_relaxed)) {
- return;
- }
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- detail::futexWake(&fu, threads.size());
- }
- fu.store(1);
- done = true;
- detail::futexWake(&fu, threads.size());
- for (auto& t : threads) {
- t.join();
- }
- }
- BENCHMARK_RELATIVE(ParkingLotWakeAll, iters) {
- BenchmarkSuspender susp;
- Barrier b(FLAGS_threads + 1);
- std::atomic<bool> done{false};
- std::vector<std::thread> threads{FLAGS_threads};
- for (auto& t : threads) {
- t = std::thread([&]() {
- b.wait();
- while (true) {
- Unit f;
- lot.park(
- &done,
- f,
- [&] { return done.load(std::memory_order_relaxed) == 0; },
- [] {});
- if (done.load(std::memory_order_relaxed)) {
- return;
- }
- }
- });
- }
- susp.dismiss();
- b.wait();
- for (auto i = 0u; i < iters; i++) {
- lot.unpark(&done, [](Unit) { return UnparkControl::RemoveContinue; });
- }
- done = true;
- lot.unpark(&done, [](Unit) { return UnparkControl::RemoveContinue; });
- for (auto& t : threads) {
- t.join();
- }
- }
- int main(int argc, char** argv) {
- gflags::ParseCommandLineFlags(&argc, &argv, true);
- folly::runBenchmarks();
- }
- /*
- ./buck-out/gen/folly/synchronization/test/parking_lot_test --benchmark
- --bm_min_iters=10000 --threads=4
- ============================================================================
- folly/synchronization/test/ParkingLotBenchmark.cpprelative time/iter iters/s
- ============================================================================
- FutexNoWaitersWake 163.43ns 6.12M
- ParkingLotNoWaitersWake 29.64% 551.43ns 1.81M
- FutexWakeOne 156.78ns 6.38M
- ParkingLotWakeOne 37.49% 418.21ns 2.39M
- FutexWakeAll 1.82us 549.52K
- ParkingLotWakeAll 449.63% 404.73ns 2.47M
- ============================================================================
- ./buck-out/gen/folly/synchronization/test/parking_lot_test --benchmark
- --bm_min_iters=10000 --threads=32
- ============================================================================
- folly/synchronization/test/ParkingLotBenchmark.cpprelative time/iter iters/s
- ============================================================================
- FutexNoWaitersWake 379.59ns 2.63M
- ParkingLotNoWaitersWake 7.94% 4.78us 209.08K
- FutexWakeOne 163.59ns 6.11M
- ParkingLotWakeOne 6.41% 2.55us 392.07K
- FutexWakeAll 12.46us 80.27K
- ParkingLotWakeAll 784.76% 1.59us 629.92K
- ============================================================================ */
|