folly/folly/concurrency/test/UnboundedQueueTest.cpp

/*
 * Copyright (c) Meta Platforms, Inc. and affiliates.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include <folly/concurrency/UnboundedQueue.h>

#include <folly/MPMCQueue.h>
#include <folly/ProducerConsumerQueue.h>
#include <folly/lang/Keep.h>
#include <folly/portability/GFlags.h>
#include <folly/portability/GTest.h>

#include <boost/thread/barrier.hpp>
#include <glog/logging.h>

#include <atomic>
#include <iomanip>
#include <thread>

DEFINE_bool(bench, false, "run benchmark");
DEFINE_int32(reps, 10, "number of reps");
DEFINE_int32(ops, 1000000, "number of operations per rep");
DEFINE_int64(capacity, 256 * 1024, "capacity");

template <typename T, bool MayBlock>
using USPSC = folly::USPSCQueue<T, MayBlock>;

template <typename T, bool MayBlock>
using UMPSC = folly::UMPSCQueue<T, MayBlock>;

template <typename T, bool MayBlock>
using USPMC = folly::USPMCQueue<T, MayBlock>;

template <typename T, bool MayBlock>
using UMPMC = folly::UMPMCQueue<T, MayBlock>;

// check functions for inspecting inlined native code

FOLLY_ATTR_WEAK void noop(folly::Optional<int>&&) {}

extern "C" FOLLY_KEEP void check_uspsc_mayblock_dequeue_ref(
    USPSC<int, true>& queue, int& item) {
  queue.dequeue(item);
}
extern "C" FOLLY_KEEP bool check_uspsc_mayblock_try_dequeue_ref(
    USPSC<int, true>& queue, int& item) {
  return queue.try_dequeue(item);
}
extern "C" FOLLY_KEEP bool check_uspsc_mayblock_try_dequeue_for_ref(
    USPSC<int, true>& queue,
    int& item,
    std::chrono::milliseconds const& timeout) {
  return queue.try_dequeue_for(item, timeout);
}
extern "C" FOLLY_KEEP bool check_uspsc_mayblock_try_dequeue_until_ref(
    USPSC<int, true>& queue,
    int& item,
    std::chrono::steady_clock::time_point const& deadline) {
  return queue.try_dequeue_until(item, deadline);
}

extern "C" FOLLY_KEEP int check_uspsc_mayblock_dequeue_ret(
    USPSC<int, true>& queue) {
  return queue.dequeue();
}
extern "C" FOLLY_KEEP void check_uspsc_mayblock_try_dequeue_ret(
    USPSC<int, true>& queue) {
  noop(queue.try_dequeue());
}
extern "C" FOLLY_KEEP void check_uspsc_mayblock_try_dequeue_for_ret(
    USPSC<int, true>& queue, std::chrono::milliseconds const& timeout) {
  noop(queue.try_dequeue_for(timeout));
}
extern "C" FOLLY_KEEP void check_uspsc_mayblock_try_dequeue_until_ret(
    USPSC<int, true>& queue,
    std::chrono::steady_clock::time_point const& deadline) {
  noop(queue.try_dequeue_until(deadline));
}

extern "C" FOLLY_KEEP void check_umpmc_mayblock_dequeue_ref(
    UMPMC<int, true>& queue, int& item) {
  queue.dequeue(item);
}
extern "C" FOLLY_KEEP bool check_umpmc_mayblock_try_dequeue_ref(
    UMPMC<int, true>& queue, int& item) {
  return queue.try_dequeue(item);
}
extern "C" FOLLY_KEEP bool check_umpmc_mayblock_try_dequeue_for_ref(
    UMPMC<int, true>& queue,
    int& item,
    std::chrono::milliseconds const& timeout) {
  return queue.try_dequeue_for(item, timeout);
}
extern "C" FOLLY_KEEP bool check_umpmc_mayblock_try_dequeue_until_ref(
    UMPMC<int, true>& queue,
    int& item,
    std::chrono::steady_clock::time_point const& deadline) {
  return queue.try_dequeue_until(item, deadline);
}

extern "C" FOLLY_KEEP int check_umpmc_mayblock_dequeue_ret(
    UMPMC<int, true>& queue) {
  return queue.dequeue();
}
extern "C" FOLLY_KEEP void check_umpmc_mayblock_try_dequeue_ret(
    UMPMC<int, true>& queue) {
  noop(queue.try_dequeue());
}
extern "C" FOLLY_KEEP void check_umpmc_mayblock_try_dequeue_for_ret(
    UMPMC<int, true>& queue, std::chrono::milliseconds const& timeout) {
  noop(queue.try_dequeue_for(timeout));
}
extern "C" FOLLY_KEEP void check_umpmc_mayblock_try_dequeue_until_ret(
    UMPMC<int, true>& queue,
    std::chrono::steady_clock::time_point const& deadline) {
  noop(queue.try_dequeue_until(deadline));
}

template <template <typename, bool> class Q, bool MayBlock>
void basic_test() {
  Q<int, MayBlock> q;
  ASSERT_TRUE(q.empty());
  ASSERT_EQ(q.size(), 0);
  int v = -1;
  ASSERT_FALSE(q.try_dequeue(v));

  q.enqueue(1);
  ASSERT_FALSE(q.empty());
  ASSERT_EQ(q.size(), 1);

  q.enqueue(2);
  ASSERT_EQ(q.size(), 2);
  ASSERT_FALSE(q.empty());

  ASSERT_TRUE(q.try_dequeue(v));
  ASSERT_EQ(v, 1);
  ASSERT_FALSE(q.empty());
  ASSERT_EQ(q.size(), 1);

  ASSERT_TRUE(q.try_dequeue(v));
  ASSERT_EQ(v, 2);
  ASSERT_TRUE(q.empty());
  ASSERT_EQ(q.size(), 0);
}

TEST(UnboundedQueue, basic) {
  basic_test<USPSC, false>();
  basic_test<UMPSC, false>();
  basic_test<USPMC, false>();
  basic_test<UMPMC, false>();
  basic_test<USPSC, true>();
  basic_test<UMPSC, true>();
  basic_test<USPMC, true>();
  basic_test<UMPMC, true>();
}

template <template <typename, bool> class Q, bool MayBlock>
void timeout_test() {
  Q<int, MayBlock> q;
  int v;
  ASSERT_FALSE(q.try_dequeue_until(
      v, std::chrono::steady_clock::now() + std::chrono::microseconds(1)));
  ASSERT_FALSE(q.try_dequeue_for(v, std::chrono::microseconds(1)));
  q.enqueue(10);
  ASSERT_TRUE(q.try_dequeue_until(
      v, std::chrono::steady_clock::now() + std::chrono::microseconds(1)));
  ASSERT_EQ(v, 10);
}

TEST(UnboundedQueue, timeout) {
  timeout_test<USPSC, false>();
  timeout_test<UMPSC, false>();
  timeout_test<USPMC, false>();
  timeout_test<UMPMC, false>();
  timeout_test<USPSC, true>();
  timeout_test<UMPSC, true>();
  timeout_test<USPMC, true>();
  timeout_test<UMPMC, true>();
}

template <template <typename, bool> class Q, bool MayBlock>
void peek_test() {
  Q<int, MayBlock> q;
  auto res = q.try_peek();
  ASSERT_FALSE(res);
  for (int i = 0; i < 1000; ++i) {
    q.enqueue(i);
  }
  for (int i = 0; i < 700; ++i) {
    int v;
    q.dequeue(v);
  }
  res = q.try_peek();
  ASSERT_TRUE(res);
  ASSERT_EQ(*res, 700);
}

TEST(UnboundedQueue, peek) {
  peek_test<USPSC, false>();
  peek_test<UMPSC, false>();
  peek_test<USPSC, true>();
  peek_test<UMPSC, true>();
}

TEST(UnboundedQueue, cleanupOnDestruction) {
  struct Foo {
    int* p_{nullptr};
    explicit Foo(int* p) : p_(p) {}
    Foo(Foo&& o) noexcept : p_(std::exchange(o.p_, nullptr)) {}
    ~Foo() {
      if (p_) {
        ++(*p_);
      }
    }
    Foo& operator=(Foo&& o) noexcept {
      p_ = std::exchange(o.p_, nullptr);
      return *this;
    }
  };
  int count = 0;
  int num = 3;
  {
    folly::UMPMCQueue<Foo, false> q;
    for (int i = 0; i < num; ++i) {
      Foo foo(&count);
      q.enqueue(std::move(foo));
    }
  }
  EXPECT_EQ(count, num);
}

template <typename ProdFunc, typename ConsFunc, typename EndFunc>
inline uint64_t run_once(
    int nprod,
    int ncons,
    const ProdFunc& prodFn,
    const ConsFunc& consFn,
    const EndFunc& endFn) {
  boost::barrier barrier(1 + nprod + ncons);

  /* producers */
  std::vector<std::thread> prodThr(nprod);
  for (int tid = 0; tid < nprod; ++tid) {
    prodThr[tid] = std::thread([&, tid] {
      barrier.wait(); // A - wait for thread start
      barrier.wait(); // B - init the work
      prodFn(tid);
      barrier.wait(); // C - join the work
    });
  }

  /* consumers */
  std::vector<std::thread> consThr(ncons);
  for (int tid = 0; tid < ncons; ++tid) {
    consThr[tid] = std::thread([&, tid] {
      barrier.wait(); // A - wait for thread start
      barrier.wait(); // B - init the work
      consFn(tid);
      barrier.wait(); // C - join the work
    });
  }

  barrier.wait(); // A - wait for thread start

  /* begin time measurement */
  auto const tbegin = std::chrono::steady_clock::now();

  barrier.wait(); // B - init the work
  barrier.wait(); // C - join the work

  /* end time measurement */
  auto const tend = std::chrono::steady_clock::now();

  /* wait for completion */
  for (int i = 0; i < nprod; ++i) {
    prodThr[i].join();
  }
  for (int i = 0; i < ncons; ++i) {
    consThr[i].join();
  }

  endFn();
  auto const dur = tend - tbegin;
  return std::chrono::duration_cast<std::chrono::nanoseconds>(dur).count();
}

template <bool SingleProducer, bool SingleConsumer, bool MayBlock>
void enq_deq_test(const int nprod, const int ncons) {
  if (SingleProducer) {
    ASSERT_EQ(nprod, 1);
  }
  if (SingleConsumer) {
    ASSERT_EQ(ncons, 1);
  }

  int ops = 1000;
  folly::UnboundedQueue<int, SingleProducer, SingleConsumer, MayBlock, 4> q;
  std::atomic<uint64_t> sum(0);

  auto prod = [&](int tid) {
    for (int i = tid; i < ops; i += nprod) {
      q.enqueue(i);
    }
  };

  auto cons = [&](int tid) {
    uint64_t mysum = 0;
    for (int i = tid; i < ops; i += ncons) {
      int v = -1;
      int vpeek = -1;

      if constexpr (SingleConsumer) {
        while (true) {
          auto res = q.try_peek();
          if (res) {
            vpeek = *res;
            break;
          }
        }
      }
      if ((i % 3) == 0) {
        while (!q.try_dequeue(v)) {
          /* keep trying */;
        }
      } else if ((i % 3) == 1) {
        auto duration = std::chrono::milliseconds(1);
        while (!q.try_dequeue_for(v, duration)) {
          /* keep trying */;
        }
      } else {
        q.dequeue(v);
      }
      if (nprod == 1 && ncons == 1) {
        ASSERT_EQ(v, i);
      }
      if (SingleConsumer) {
        ASSERT_EQ(v, vpeek);
      }
      mysum += v;
    }
    sum.fetch_add(mysum);
  };

  auto endfn = [&] {
    uint64_t expected = (ops) * (ops - 1) / 2;
    uint64_t actual = sum.load();
    ASSERT_EQ(expected, actual);
  };
  run_once(nprod, ncons, prod, cons, endfn);
}

TEST(UnboundedQueue, enqDeq) {
  /* SPSC */
  enq_deq_test<true, true, false>(1, 1);
  enq_deq_test<true, true, true>(1, 1);
  /* MPSC */
  enq_deq_test<false, true, false>(1, 1);
  enq_deq_test<false, true, true>(1, 1);
  enq_deq_test<false, true, false>(2, 1);
  enq_deq_test<false, true, true>(2, 1);
  enq_deq_test<false, true, false>(10, 1);
  enq_deq_test<false, true, true>(10, 1);
  /* SPMC */
  enq_deq_test<true, false, false>(1, 1);
  enq_deq_test<true, false, true>(1, 1);
  enq_deq_test<true, false, false>(1, 2);
  enq_deq_test<true, false, true>(1, 2);
  enq_deq_test<true, false, false>(1, 10);
  enq_deq_test<true, false, true>(1, 10);
  /* MPMC */
  enq_deq_test<false, false, false>(1, 1);
  enq_deq_test<false, false, true>(1, 1);
  enq_deq_test<false, false, false>(2, 1);
  enq_deq_test<false, false, true>(2, 1);
  enq_deq_test<false, false, false>(10, 1);
  enq_deq_test<false, false, true>(10, 1);
  enq_deq_test<false, false, false>(1, 2);
  enq_deq_test<false, false, true>(1, 2);
  enq_deq_test<false, false, false>(1, 10);
  enq_deq_test<false, false, true>(1, 10);
  enq_deq_test<false, false, false>(2, 2);
  enq_deq_test<false, false, true>(2, 2);
  enq_deq_test<false, false, false>(10, 10);
  enq_deq_test<false, false, true>(10, 10);
}

template <typename RepFunc>
uint64_t runBench(const std::string& name, uint64_t ops, const RepFunc& repFn) {
  uint64_t reps = FLAGS_reps;
  uint64_t min = UINTMAX_MAX;
  uint64_t max = 0;
  uint64_t sum = 0;

  std::vector<uint64_t> durs(reps);

  repFn(); // sometimes first run is outlier
  for (uint64_t r = 0; r < reps; ++r) {
    uint64_t dur = repFn();
    durs[r] = dur;
    sum += dur;
    min = std::min(min, dur);
    max = std::max(max, dur);
    // if each rep takes too long run at least 3 reps
    const uint64_t minute = 60000000000ULL;
    if (sum > minute && r >= 2) {
      reps = r + 1;
      break;
    }
  }

  const std::string unit = " ns";
  uint64_t avg = sum / reps;
  uint64_t res = min;
  uint64_t varsum = 0;
  for (uint64_t r = 0; r < reps; ++r) {
    auto term = int64_t(reps * durs[r]) - int64_t(sum);
    varsum += term * term;
  }
  uint64_t dev = uint64_t(std::sqrt(varsum) * std::pow(reps, -1.5));
  std::cout << name;
  std::cout << "   " << std::setw(4) << max / ops << unit;
  std::cout << "   " << std::setw(4) << avg / ops << unit;
  std::cout << "   " << std::setw(4) << dev / ops << unit;
  std::cout << "   " << std::setw(4) << res / ops << unit;
  std::cout << std::endl;
  return res;
}

template <template <typename, bool> class Q, typename T, int Op>
uint64_t bench(const int nprod, const int ncons, const std::string& name) {
  const uint64_t ops = FLAGS_ops;
  auto repFn = [&, ops] {
    Q<T, Op == 3 || Op == 4 || Op == 5> q;
    std::atomic<uint64_t> sum(0);
    auto prod = [&](int tid) {
      for (uint64_t i = tid; i < ops; i += nprod) {
        q.enqueue(i);
      }
    };
    auto cons = [&](int tid) {
      uint64_t mysum = 0;
      for (uint64_t i = tid; i < ops; i += ncons) {
        T v;
        if (Op == 0 || Op == 3) {
          while (FOLLY_UNLIKELY(!q.try_dequeue(v))) {
            /* keep trying */;
          }
        } else if (Op == 1 || Op == 4) {
          auto duration = std::chrono::microseconds(1000);
          while (FOLLY_UNLIKELY(!q.try_dequeue_for(v, duration))) {
            /* keep trying */;
          }
        } else {
          DCHECK(Op == 2 || Op == 5);
          q.dequeue(v);
        }
        if (nprod == 1 && ncons == 1) {
          DCHECK_EQ(int(v), i);
        }
        mysum += v;
      }
      sum.fetch_add(mysum);
    };
    auto endfn = [&] {
      uint64_t expected = (ops) * (ops - 1) / 2;
      uint64_t actual = sum.load();
      DCHECK_EQ(expected, actual);
    };
    return run_once(nprod, ncons, prod, cons, endfn);
  };
  return runBench(name, ops, repFn);
}

/* For performance comparison */
template <typename T>
class MPMC {
  folly::MPMCQueue<T> q_;

 public:
  MPMC() : q_(FLAGS_capacity) {}

  template <typename... Args>
  void enqueue(Args&&... args) {
    q_.blockingWrite(std::forward<Args>(args)...);
  }

  void dequeue(T& item) { q_.blockingRead(item); }

  bool try_dequeue(T& item) { return q_.read(item); }

  template <typename Rep, typename Period>
  bool try_dequeue_for(
      T& item, const std::chrono::duration<Rep, Period>& duration) noexcept {
    auto deadline = std::chrono::steady_clock::now() + duration;
    return q_.tryReadUntil(deadline, item);
  }
};

template <typename T, bool ignore>
using FMPMC = MPMC<T>;

template <typename T>
class PCQ {
  folly::ProducerConsumerQueue<T> q_;

 public:
  PCQ() : q_(FLAGS_capacity) {}

  template <typename... Args>
  void enqueue(Args&&... args) {
    while (!q_.write(std::forward<Args>(args)...)) {
      /* keep trying*/;
    }
  }

  void dequeue(T&) { ASSERT_TRUE(false); }

  bool try_dequeue(T& item) { return q_.read(item); }

  template <typename Rep, typename Period>
  bool try_dequeue_for(T&, const std::chrono::duration<Rep, Period>&) noexcept {
    return false;
  }
};

template <typename T, bool ignore>
using FPCQ = PCQ<T>;

template <size_t M>
struct IntArray {
  int a[M];
  IntArray() {}
  /* implicit */ IntArray(int v) {
    for (size_t i = 0; i < M; ++i) {
      a[i] = v;
    }
  }
  operator int() { return a[0]; }
};

void dottedLine() {
  std::cout
      << "........................................................................"
      << std::endl;
}

template <typename T>
void type_benches(const int np, const int nc, const std::string& name) {
  std::cout << name << "====================================================="
            << std::endl;
  if (np == 1 && nc == 1) {
    bench<USPSC, T, 0>(1, 1, "Unbounded SPSC try   spin only  ");
    bench<USPSC, T, 1>(1, 1, "Unbounded SPSC timed spin only  ");
    bench<USPSC, T, 2>(1, 1, "Unbounded SPSC wait  spin only  ");
    bench<USPSC, T, 3>(1, 1, "Unbounded SPSC try   may block  ");
    bench<USPSC, T, 4>(1, 1, "Unbounded SPSC timed may block  ");
    bench<USPSC, T, 5>(1, 1, "Unbounded SPSC wait  may block  ");
    dottedLine();
  }
  if (nc == 1) {
    bench<UMPSC, T, 0>(np, 1, "Unbounded MPSC try   spin only  ");
    bench<UMPSC, T, 1>(np, 1, "Unbounded MPSC timed spin only  ");
    bench<UMPSC, T, 2>(np, 1, "Unbounded MPSC wait  spin only  ");
    bench<UMPSC, T, 3>(np, 1, "Unbounded MPSC try   may block  ");
    bench<UMPSC, T, 4>(np, 1, "Unbounded MPSC timed may block  ");
    bench<UMPSC, T, 5>(np, 1, "Unbounded MPSC wait  may block  ");
    dottedLine();
  }
  if (np == 1) {
    bench<USPMC, T, 0>(1, nc, "Unbounded SPMC try   spin only  ");
    bench<USPMC, T, 1>(1, nc, "Unbounded SPMC timed spin only  ");
    bench<USPMC, T, 2>(1, nc, "Unbounded SPMC wait  spin only  ");
    bench<USPMC, T, 3>(1, nc, "Unbounded SPMC try   may block  ");
    bench<USPMC, T, 4>(1, nc, "Unbounded SPMC timed may block  ");
    bench<USPMC, T, 5>(1, nc, "Unbounded SPMC wait  may block  ");
    dottedLine();
  }
  bench<UMPMC, T, 0>(np, nc, "Unbounded MPMC try   spin only  ");
  bench<UMPMC, T, 1>(np, nc, "Unbounded MPMC timed spin only  ");
  bench<UMPMC, T, 2>(np, nc, "Unbounded MPMC wait  spin only  ");
  bench<UMPMC, T, 3>(np, nc, "Unbounded MPMC try   may block  ");
  bench<UMPMC, T, 4>(np, nc, "Unbounded MPMC timed may block  ");
  bench<UMPMC, T, 5>(np, nc, "Unbounded MPMC wait  may block  ");
  dottedLine();
  if (np == 1 && nc == 1) {
    bench<FPCQ, T, 0>(1, 1, "folly::PCQ  read                ");
    dottedLine();
  }
  bench<FMPMC, T, 3>(np, nc, "folly::MPMC  read               ");
  bench<FMPMC, T, 4>(np, nc, "folly::MPMC  tryReadUntil       ");
  bench<FMPMC, T, 5>(np, nc, "folly::MPMC  blockingRead       ");
  std::cout
      << "========================================================================"
      << std::endl;
}

void benches(const int np, const int nc) {
  std::cout << "====================== " << std::setw(2) << np << " prod"
            << "  " << std::setw(2) << nc << " cons"
            << " ================================" << std::endl;
  type_benches<uint32_t>(np, nc, "=== uint32_t ======");
  // Benchmarks for other element sizes can be added as follows:
  //   type_benches<IntArray<4>>(np, nc, "=== IntArray<4> ===");
}

TEST(UnboundedQueue, bench) {
  if (!FLAGS_bench) {
    return;
  }
  std::cout
      << "========================================================================"
      << std::endl;
  std::cout << std::setw(2) << FLAGS_reps << " reps of " << std::setw(8)
            << FLAGS_ops << " handoffs\n";
  dottedLine();
  std::cout << "$ numactl -N 1 $dir/unbounded_queue_test --bench\n";
  dottedLine();
  std::cout << "Using capacity " << FLAGS_capacity
            << " for folly::ProducerConsumerQueue and\n"
            << "folly::MPMCQueue\n";
  std::cout
      << "========================================================================"
      << std::endl;
  std::cout
      << "Test name                         Max time  Avg time  Dev time  Min time"
      << std::endl;

  for (int nc : {1, 2, 4, 8, 16, 32}) {
    int np = 1;
    benches(np, nc);
  }

  for (int np : {1, 2, 4, 8, 16, 32}) {
    int nc = 1;
    benches(np, nc);
  }

  for (int np : {2, 4, 8, 16, 32}) {
    for (int nc : {2, 4, 8, 16, 32}) {
      benches(np, nc);
    }
  }
}

/*
==============================================================
10 reps of  1000000 handoffs
..............................................................
$ numactl -N 1 $dir/unbounded_queue_test --bench
..............................................................
Using capacity 262144 for folly::ProducerConsumerQueue and
folly::MPMCQueue
==============================================================
Test name                         Max time  Avg time  Min time
======================  1 prod   1 cons ======================
=== uint32_t =================================================
Unbounded SPSC try   spin only        5 ns      5 ns      5 ns
Unbounded SPSC timed spin only        5 ns      5 ns      5 ns
Unbounded SPSC wait  spin only        6 ns      6 ns      5 ns
Unbounded SPSC try   may block       38 ns     37 ns     35 ns
Unbounded SPSC timed may block       38 ns     36 ns     34 ns
Unbounded SPSC wait  may block       34 ns     34 ns     33 ns
..............................................................
Unbounded MPSC try   spin only       45 ns     43 ns     42 ns
Unbounded MPSC timed spin only       47 ns     43 ns     42 ns
Unbounded MPSC wait  spin only       45 ns     43 ns     41 ns
Unbounded MPSC try   may block       55 ns     52 ns     51 ns
Unbounded MPSC timed may block       54 ns     52 ns     51 ns
Unbounded MPSC wait  may block       51 ns     50 ns     49 ns
..............................................................
Unbounded SPMC try   spin only       18 ns     17 ns     16 ns
Unbounded SPMC timed spin only       23 ns     21 ns     18 ns
Unbounded SPMC wait  spin only       22 ns     19 ns     16 ns
Unbounded SPMC try   may block       30 ns     26 ns     22 ns
Unbounded SPMC timed may block       32 ns     24 ns     20 ns
Unbounded SPMC wait  may block       49 ns     35 ns     29 ns
..............................................................
Unbounded MPMC try   spin only       25 ns     24 ns     24 ns
Unbounded MPMC timed spin only       38 ns     35 ns     30 ns
Unbounded MPMC wait  spin only       41 ns     39 ns     37 ns
Unbounded MPMC try   may block       53 ns     52 ns     51 ns
Unbounded MPMC timed may block       52 ns     51 ns     49 ns
Unbounded MPMC wait  may block       53 ns     51 ns     50 ns
..............................................................
folly::PCQ  read                     16 ns     11 ns      7 ns
..............................................................
folly::MPMC  read                    52 ns     52 ns     51 ns
folly::MPMC  tryReadUntil            96 ns     90 ns     55 ns
folly::MPMC  blockingRead            61 ns     56 ns     50 ns
==============================================================
======================  1 prod   2 cons ======================
=== uint32_t =================================================
Unbounded SPMC try   spin only       76 ns     68 ns     53 ns
Unbounded SPMC timed spin only       79 ns     71 ns     65 ns
Unbounded SPMC wait  spin only       39 ns     35 ns     32 ns
Unbounded SPMC try   may block       83 ns     81 ns     76 ns
Unbounded SPMC timed may block       86 ns     63 ns     23 ns
Unbounded SPMC wait  may block       38 ns     36 ns     34 ns
..............................................................
Unbounded MPMC try   spin only       86 ns     79 ns     64 ns
Unbounded MPMC timed spin only       84 ns     77 ns     74 ns
Unbounded MPMC wait  spin only       36 ns     35 ns     34 ns
Unbounded MPMC try   may block       83 ns     79 ns     75 ns
Unbounded MPMC timed may block       83 ns     76 ns     63 ns
Unbounded MPMC wait  may block       56 ns     48 ns     36 ns
..............................................................
folly::MPMC  read                   103 ns     93 ns     68 ns
folly::MPMC  tryReadUntil           109 ns    102 ns     91 ns
folly::MPMC  blockingRead            61 ns     58 ns     54 ns
==============================================================
======================  1 prod   4 cons ======================
=== uint32_t =================================================
Unbounded SPMC try   spin only      116 ns    109 ns     97 ns
Unbounded SPMC timed spin only      117 ns    111 ns    108 ns
Unbounded SPMC wait  spin only       43 ns     40 ns     37 ns
Unbounded SPMC try   may block      127 ns    113 ns     98 ns
Unbounded SPMC timed may block      116 ns    109 ns     97 ns
Unbounded SPMC wait  may block       45 ns     43 ns     40 ns
..............................................................
Unbounded MPMC try   spin only      121 ns    113 ns    102 ns
Unbounded MPMC timed spin only      118 ns    108 ns     88 ns
Unbounded MPMC wait  spin only       45 ns     41 ns     34 ns
Unbounded MPMC try   may block      117 ns    108 ns     96 ns
Unbounded MPMC timed may block      118 ns    109 ns     99 ns
Unbounded MPMC wait  may block       62 ns     53 ns     43 ns
..............................................................
folly::MPMC  read                   139 ns    130 ns    111 ns
folly::MPMC  tryReadUntil           205 ns    135 ns    115 ns
folly::MPMC  blockingRead           104 ns     74 ns     54 ns
==============================================================
======================  1 prod   8 cons ======================
=== uint32_t =================================================
Unbounded SPMC try   spin only      169 ns    163 ns    157 ns
Unbounded SPMC timed spin only      167 ns    158 ns    133 ns
Unbounded SPMC wait  spin only       44 ns     39 ns     36 ns
Unbounded SPMC try   may block      170 ns    165 ns    156 ns
Unbounded SPMC timed may block      172 ns    163 ns    153 ns
Unbounded SPMC wait  may block       49 ns     40 ns     35 ns
..............................................................
Unbounded MPMC try   spin only      166 ns    158 ns    149 ns
Unbounded MPMC timed spin only      171 ns    161 ns    145 ns
Unbounded MPMC wait  spin only       62 ns     52 ns     42 ns
Unbounded MPMC try   may block      169 ns    161 ns    149 ns
Unbounded MPMC timed may block      170 ns    160 ns    147 ns
Unbounded MPMC wait  may block       70 ns     63 ns     61 ns
..............................................................
folly::MPMC  read                   174 ns    167 ns    159 ns
folly::MPMC  tryReadUntil           349 ns    171 ns    148 ns
folly::MPMC  blockingRead           182 ns    138 ns    115 ns
==============================================================
======================  1 prod  16 cons ======================
=== uint32_t =================================================
Unbounded SPMC try   spin only      219 ns    198 ns    190 ns
Unbounded SPMC timed spin only      202 ns    198 ns    193 ns
Unbounded SPMC wait  spin only       36 ns     36 ns     35 ns
Unbounded SPMC try   may block      202 ns    195 ns    190 ns
Unbounded SPMC timed may block      208 ns    197 ns    190 ns
Unbounded SPMC wait  may block       96 ns     77 ns     64 ns
..............................................................
Unbounded MPMC try   spin only      204 ns    198 ns    194 ns
Unbounded MPMC timed spin only      202 ns    195 ns    190 ns
Unbounded MPMC wait  spin only       61 ns     59 ns     57 ns
Unbounded MPMC try   may block      206 ns    196 ns    191 ns
Unbounded MPMC timed may block      204 ns    198 ns    192 ns
Unbounded MPMC wait  may block      100 ns     88 ns     84 ns
..............................................................
folly::MPMC  read                   210 ns    191 ns    182 ns
folly::MPMC  tryReadUntil           574 ns    248 ns    192 ns
folly::MPMC  blockingRead          1400 ns   1319 ns   1227 ns
==============================================================
======================  1 prod  32 cons ======================
=== uint32_t =================================================
Unbounded SPMC try   spin only      209 ns    205 ns    199 ns
Unbounded SPMC timed spin only      208 ns    205 ns    200 ns
Unbounded SPMC wait  spin only      175 ns     51 ns     33 ns
Unbounded SPMC try   may block      215 ns    203 ns    186 ns
Unbounded SPMC timed may block      453 ns    334 ns    204 ns
Unbounded SPMC wait  may block      110 ns     87 ns     55 ns
..............................................................
Unbounded MPMC try   spin only      328 ns    218 ns    197 ns
Unbounded MPMC timed spin only      217 ns    206 ns    200 ns
Unbounded MPMC wait  spin only      147 ns     85 ns     58 ns
Unbounded MPMC try   may block      310 ns    223 ns    199 ns
Unbounded MPMC timed may block      461 ns    275 ns    196 ns
Unbounded MPMC wait  may block      148 ns    111 ns     78 ns
..............................................................
folly::MPMC  read                   280 ns    215 ns    194 ns
folly::MPMC  tryReadUntil          28740 ns   13508 ns    212 ns
folly::MPMC  blockingRead          1343 ns   1293 ns   1269 ns
==============================================================
======================  1 prod   1 cons ======================
=== uint32_t =================================================
Unbounded SPSC try   spin only        5 ns      5 ns      5 ns
Unbounded SPSC timed spin only        8 ns      6 ns      6 ns
Unbounded SPSC wait  spin only        6 ns      6 ns      5 ns
Unbounded SPSC try   may block       37 ns     36 ns     35 ns
Unbounded SPSC timed may block       37 ns     36 ns     35 ns
Unbounded SPSC wait  may block       35 ns     35 ns     34 ns
..............................................................
Unbounded MPSC try   spin only       43 ns     42 ns     41 ns
Unbounded MPSC timed spin only       45 ns     42 ns     42 ns
Unbounded MPSC wait  spin only       44 ns     43 ns     42 ns
Unbounded MPSC try   may block       55 ns     51 ns     50 ns
Unbounded MPSC timed may block       61 ns     52 ns     50 ns
Unbounded MPSC wait  may block       54 ns     52 ns     50 ns
..............................................................
Unbounded SPMC try   spin only       18 ns     17 ns     17 ns
Unbounded SPMC timed spin only       23 ns     19 ns     17 ns
Unbounded SPMC wait  spin only       20 ns     17 ns     15 ns
Unbounded SPMC try   may block       30 ns     23 ns     19 ns
Unbounded SPMC timed may block       23 ns     19 ns     17 ns
Unbounded SPMC wait  may block       36 ns     31 ns     26 ns
..............................................................
Unbounded MPMC try   spin only       25 ns     23 ns     17 ns
Unbounded MPMC timed spin only       37 ns     34 ns     25 ns
Unbounded MPMC wait  spin only       40 ns     38 ns     36 ns
Unbounded MPMC try   may block       51 ns     49 ns     48 ns
Unbounded MPMC timed may block       53 ns     50 ns     48 ns
Unbounded MPMC wait  may block       53 ns     49 ns     34 ns
..............................................................
folly::PCQ  read                     15 ns     12 ns      7 ns
..............................................................
folly::MPMC  read                    53 ns     51 ns     50 ns
folly::MPMC  tryReadUntil           100 ns     96 ns     90 ns
folly::MPMC  blockingRead            75 ns     59 ns     52 ns
==============================================================
======================  2 prod   1 cons ======================
=== uint32_t =================================================
Unbounded MPSC try   spin only       49 ns     49 ns     46 ns
Unbounded MPSC timed spin only       52 ns     50 ns     49 ns
Unbounded MPSC wait  spin only       53 ns     52 ns     51 ns
Unbounded MPSC try   may block       63 ns     60 ns     57 ns
Unbounded MPSC timed may block       64 ns     61 ns     54 ns
Unbounded MPSC wait  may block       62 ns     59 ns     35 ns
..............................................................
Unbounded MPMC try   spin only       44 ns     41 ns     38 ns
Unbounded MPMC timed spin only       50 ns     49 ns     49 ns
Unbounded MPMC wait  spin only       51 ns     49 ns     49 ns
Unbounded MPMC try   may block       63 ns     60 ns     57 ns
Unbounded MPMC timed may block       62 ns     60 ns     57 ns
Unbounded MPMC wait  may block       62 ns     60 ns     58 ns
..............................................................
folly::MPMC  read                    78 ns     57 ns     52 ns
folly::MPMC  tryReadUntil            78 ns     72 ns     70 ns
folly::MPMC  blockingRead            56 ns     54 ns     52 ns
==============================================================
======================  4 prod   1 cons ======================
=== uint32_t =================================================
Unbounded MPSC try   spin only       48 ns     47 ns     46 ns
Unbounded MPSC timed spin only       47 ns     47 ns     46 ns
Unbounded MPSC wait  spin only       49 ns     47 ns     47 ns
Unbounded MPSC try   may block       61 ns     59 ns     55 ns
Unbounded MPSC timed may block       62 ns     58 ns     46 ns
Unbounded MPSC wait  may block       62 ns     61 ns     59 ns
..............................................................
Unbounded MPMC try   spin only       42 ns     42 ns     40 ns
Unbounded MPMC timed spin only       48 ns     47 ns     45 ns
Unbounded MPMC wait  spin only       48 ns     47 ns     46 ns
Unbounded MPMC try   may block       63 ns     62 ns     61 ns
Unbounded MPMC timed may block       63 ns     61 ns     51 ns
Unbounded MPMC wait  may block       62 ns     61 ns     59 ns
..............................................................
folly::MPMC  read                    56 ns     55 ns     54 ns
folly::MPMC  tryReadUntil           112 ns    106 ns     97 ns
folly::MPMC  blockingRead            47 ns     47 ns     45 ns
==============================================================
======================  8 prod   1 cons ======================
=== uint32_t =================================================
Unbounded MPSC try   spin only       44 ns     43 ns     42 ns
Unbounded MPSC timed spin only       45 ns     44 ns     40 ns
Unbounded MPSC wait  spin only       45 ns     44 ns     41 ns
Unbounded MPSC try   may block       61 ns     60 ns     58 ns
Unbounded MPSC timed may block       61 ns     59 ns     56 ns
Unbounded MPSC wait  may block       61 ns     59 ns     56 ns
..............................................................
Unbounded MPMC try   spin only       43 ns     40 ns     36 ns
Unbounded MPMC timed spin only       45 ns     44 ns     41 ns
Unbounded MPMC wait  spin only       45 ns     43 ns     41 ns
Unbounded MPMC try   may block       62 ns     60 ns     58 ns
Unbounded MPMC timed may block       62 ns     59 ns     56 ns
Unbounded MPMC wait  may block       61 ns     58 ns     54 ns
..............................................................
folly::MPMC  read                   147 ns    119 ns     63 ns
folly::MPMC  tryReadUntil           152 ns    130 ns     97 ns
folly::MPMC  blockingRead           135 ns    101 ns     48 ns
==============================================================
====================== 16 prod   1 cons ======================
=== uint32_t =================================================
Unbounded MPSC try   spin only       47 ns     38 ns     35 ns
Unbounded MPSC timed spin only       36 ns     36 ns     35 ns
Unbounded MPSC wait  spin only       46 ns     37 ns     35 ns
Unbounded MPSC try   may block       58 ns     47 ns     45 ns
Unbounded MPSC timed may block       46 ns     46 ns     45 ns
Unbounded MPSC wait  may block       47 ns     45 ns     45 ns
..............................................................
Unbounded MPMC try   spin only       41 ns     39 ns     35 ns
Unbounded MPMC timed spin only       45 ns     41 ns     38 ns
Unbounded MPMC wait  spin only       43 ns     40 ns     38 ns
Unbounded MPMC try   may block       51 ns     49 ns     47 ns
Unbounded MPMC timed may block       52 ns     49 ns     47 ns
Unbounded MPMC wait  may block       59 ns     50 ns     46 ns
..............................................................
folly::MPMC  read                   924 ns    839 ns    664 ns
folly::MPMC  tryReadUntil           968 ns    865 ns    678 ns
folly::MPMC  blockingRead           929 ns    727 ns    487 ns
==============================================================
====================== 32 prod   1 cons ======================
=== uint32_t =================================================
Unbounded MPSC try   spin only       90 ns     44 ns     36 ns
Unbounded MPSC timed spin only       91 ns     43 ns     35 ns
Unbounded MPSC wait  spin only       92 ns     55 ns     36 ns
Unbounded MPSC try   may block       87 ns     52 ns     45 ns
Unbounded MPSC timed may block       70 ns     48 ns     45 ns
Unbounded MPSC wait  may block      109 ns     60 ns     45 ns
..............................................................
Unbounded MPMC try   spin only       47 ns     42 ns     37 ns
Unbounded MPMC timed spin only       50 ns     46 ns     38 ns
Unbounded MPMC wait  spin only       50 ns     42 ns     36 ns
Unbounded MPMC try   may block      103 ns     59 ns     50 ns
Unbounded MPMC timed may block       56 ns     52 ns     47 ns
Unbounded MPMC wait  may block       59 ns     51 ns     46 ns
..............................................................
folly::MPMC  read                  1029 ns    911 ns    694 ns
folly::MPMC  tryReadUntil          1023 ns    969 ns    907 ns
folly::MPMC  blockingRead          1024 ns    921 ns    790 ns
==============================================================
======================  2 prod   2 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only       83 ns     66 ns     24 ns
Unbounded MPMC timed spin only       84 ns     74 ns     49 ns
Unbounded MPMC wait  spin only       50 ns     49 ns     47 ns
Unbounded MPMC try   may block       86 ns     81 ns     77 ns
Unbounded MPMC timed may block       82 ns     74 ns     59 ns
Unbounded MPMC wait  may block       62 ns     59 ns     56 ns
..............................................................
folly::MPMC  read                    98 ns     85 ns     63 ns
folly::MPMC  tryReadUntil           105 ns     94 ns     83 ns
folly::MPMC  blockingRead            59 ns     56 ns     54 ns
==============================================================
======================  2 prod   4 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      114 ns    105 ns     91 ns
Unbounded MPMC timed spin only      119 ns    107 ns    102 ns
Unbounded MPMC wait  spin only       54 ns     53 ns     52 ns
Unbounded MPMC try   may block      114 ns    106 ns     93 ns
Unbounded MPMC timed may block      111 ns    100 ns     92 ns
Unbounded MPMC wait  may block       70 ns     64 ns     60 ns
..............................................................
folly::MPMC  read                   133 ns    125 ns    120 ns
folly::MPMC  tryReadUntil           130 ns    125 ns    114 ns
folly::MPMC  blockingRead            69 ns     68 ns     66 ns
==============================================================
======================  2 prod   8 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      169 ns    160 ns    152 ns
Unbounded MPMC timed spin only      165 ns    158 ns    149 ns
Unbounded MPMC wait  spin only       59 ns     54 ns     45 ns
Unbounded MPMC try   may block      166 ns    158 ns    131 ns
Unbounded MPMC timed may block      168 ns    163 ns    158 ns
Unbounded MPMC wait  may block       73 ns     66 ns     60 ns
..............................................................
folly::MPMC  read                   170 ns    167 ns    160 ns
folly::MPMC  tryReadUntil           163 ns    154 ns    146 ns
folly::MPMC  blockingRead            82 ns     73 ns     60 ns
==============================================================
======================  2 prod  16 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      207 ns    198 ns    191 ns
Unbounded MPMC timed spin only      211 ns    198 ns    192 ns
Unbounded MPMC wait  spin only       57 ns     55 ns     54 ns
Unbounded MPMC try   may block      197 ns    193 ns    188 ns
Unbounded MPMC timed may block      201 ns    195 ns    188 ns
Unbounded MPMC wait  may block       89 ns     78 ns     70 ns
..............................................................
folly::MPMC  read                   196 ns    189 ns    181 ns
folly::MPMC  tryReadUntil           202 ns    184 ns    173 ns
folly::MPMC  blockingRead           267 ns    100 ns     76 ns
==============================================================
======================  2 prod  32 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      228 ns    207 ns    193 ns
Unbounded MPMC timed spin only      210 ns    205 ns    198 ns
Unbounded MPMC wait  spin only      102 ns     71 ns     56 ns
Unbounded MPMC try   may block      268 ns    211 ns    198 ns
Unbounded MPMC timed may block      226 ns    205 ns    183 ns
Unbounded MPMC wait  may block      502 ns    164 ns     67 ns
..............................................................
folly::MPMC  read                   228 ns    205 ns    195 ns
folly::MPMC  tryReadUntil           207 ns    200 ns    192 ns
folly::MPMC  blockingRead           830 ns    612 ns    192 ns
==============================================================
======================  4 prod   2 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only       87 ns     65 ns     33 ns
Unbounded MPMC timed spin only       79 ns     60 ns     36 ns
Unbounded MPMC wait  spin only       47 ns     46 ns     44 ns
Unbounded MPMC try   may block       87 ns     77 ns     52 ns
Unbounded MPMC timed may block       86 ns     79 ns     57 ns
Unbounded MPMC wait  may block       62 ns     61 ns     60 ns
..............................................................
folly::MPMC  read                   110 ns     95 ns     60 ns
folly::MPMC  tryReadUntil           108 ns    104 ns     96 ns
folly::MPMC  blockingRead            60 ns     57 ns     47 ns
==============================================================
======================  4 prod   4 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      110 ns    100 ns     86 ns
Unbounded MPMC timed spin only      113 ns    104 ns     93 ns
Unbounded MPMC wait  spin only       49 ns     46 ns     45 ns
Unbounded MPMC try   may block      115 ns    105 ns     84 ns
Unbounded MPMC timed may block      119 ns    108 ns     89 ns
Unbounded MPMC wait  may block       63 ns     61 ns     54 ns
..............................................................
folly::MPMC  read                   140 ns    131 ns    113 ns
folly::MPMC  tryReadUntil           132 ns    129 ns    121 ns
folly::MPMC  blockingRead            58 ns     53 ns     48 ns
==============================================================
======================  4 prod   8 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      170 ns    162 ns    151 ns
Unbounded MPMC timed spin only      174 ns    158 ns    139 ns
Unbounded MPMC wait  spin only       51 ns     50 ns     48 ns
Unbounded MPMC try   may block      164 ns    160 ns    154 ns
Unbounded MPMC timed may block      165 ns    158 ns    144 ns
Unbounded MPMC wait  may block       67 ns     62 ns     52 ns
..............................................................
folly::MPMC  read                   174 ns    166 ns    156 ns
folly::MPMC  tryReadUntil           165 ns    160 ns    150 ns
folly::MPMC  blockingRead            58 ns     56 ns     49 ns
==============================================================
======================  4 prod  16 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      200 ns    195 ns    181 ns
Unbounded MPMC timed spin only      200 ns    195 ns    191 ns
Unbounded MPMC wait  spin only       51 ns     49 ns     45 ns
Unbounded MPMC try   may block      198 ns    192 ns    188 ns
Unbounded MPMC timed may block      199 ns    190 ns    182 ns
Unbounded MPMC wait  may block       77 ns     66 ns     60 ns
..............................................................
folly::MPMC  read                   195 ns    186 ns    175 ns
folly::MPMC  tryReadUntil           204 ns    187 ns    167 ns
folly::MPMC  blockingRead            66 ns     60 ns     57 ns
==============================================================
======================  4 prod  32 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      246 ns    210 ns    195 ns
Unbounded MPMC timed spin only      217 ns    207 ns    199 ns
Unbounded MPMC wait  spin only       66 ns     52 ns     46 ns
Unbounded MPMC try   may block      250 ns    207 ns    197 ns
Unbounded MPMC timed may block      208 ns    202 ns    195 ns
Unbounded MPMC wait  may block       80 ns     66 ns     56 ns
..............................................................
folly::MPMC  read                   231 ns    201 ns    190 ns
folly::MPMC  tryReadUntil           202 ns    199 ns    196 ns
folly::MPMC  blockingRead            65 ns     61 ns     57 ns
==============================================================
======================  8 prod   2 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only       50 ns     41 ns     39 ns
Unbounded MPMC timed spin only       73 ns     49 ns     40 ns
Unbounded MPMC wait  spin only       46 ns     43 ns     39 ns
Unbounded MPMC try   may block       81 ns     62 ns     56 ns
Unbounded MPMC timed may block       75 ns     61 ns     53 ns
Unbounded MPMC wait  may block       61 ns     57 ns     50 ns
..............................................................
folly::MPMC  read                   120 ns    102 ns     58 ns
folly::MPMC  tryReadUntil           119 ns    112 ns    103 ns
folly::MPMC  blockingRead            85 ns     71 ns     58 ns
==============================================================
======================  8 prod   4 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      104 ns     87 ns     39 ns
Unbounded MPMC timed spin only      109 ns     89 ns     40 ns
Unbounded MPMC wait  spin only       46 ns     45 ns     43 ns
Unbounded MPMC try   may block      121 ns    101 ns     74 ns
Unbounded MPMC timed may block      116 ns    103 ns     72 ns
Unbounded MPMC wait  may block       62 ns     57 ns     52 ns
..............................................................
folly::MPMC  read                   136 ns    130 ns    118 ns
folly::MPMC  tryReadUntil           132 ns    127 ns    118 ns
folly::MPMC  blockingRead            68 ns     61 ns     51 ns
==============================================================
======================  8 prod   8 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      175 ns    171 ns    162 ns
Unbounded MPMC timed spin only      177 ns    169 ns    159 ns
Unbounded MPMC wait  spin only       49 ns     47 ns     45 ns
Unbounded MPMC try   may block      175 ns    171 ns    156 ns
Unbounded MPMC timed may block      180 ns    170 ns    162 ns
Unbounded MPMC wait  may block       63 ns     62 ns     59 ns
..............................................................
folly::MPMC  read                   177 ns    162 ns    147 ns
folly::MPMC  tryReadUntil           170 ns    162 ns    148 ns
folly::MPMC  blockingRead            57 ns     53 ns     49 ns
==============================================================
======================  8 prod  16 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      203 ns    192 ns    185 ns
Unbounded MPMC timed spin only      199 ns    193 ns    185 ns
Unbounded MPMC wait  spin only       48 ns     46 ns     44 ns
Unbounded MPMC try   may block      204 ns    194 ns    182 ns
Unbounded MPMC timed may block      198 ns    187 ns    171 ns
Unbounded MPMC wait  may block       63 ns     61 ns     57 ns
..............................................................
folly::MPMC  read                   193 ns    185 ns    167 ns
folly::MPMC  tryReadUntil           199 ns    188 ns    164 ns
folly::MPMC  blockingRead            57 ns     52 ns     49 ns
==============================================================
======================  8 prod  32 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      222 ns    208 ns    198 ns
Unbounded MPMC timed spin only      234 ns    212 ns    203 ns
Unbounded MPMC wait  spin only       89 ns     58 ns     45 ns
Unbounded MPMC try   may block      234 ns    207 ns    196 ns
Unbounded MPMC timed may block      205 ns    203 ns    197 ns
Unbounded MPMC wait  may block       65 ns     63 ns     61 ns
..............................................................
folly::MPMC  read                   240 ns    204 ns    194 ns
folly::MPMC  tryReadUntil           205 ns    202 ns    199 ns
folly::MPMC  blockingRead            56 ns     52 ns     49 ns
==============================================================
====================== 16 prod   2 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only       52 ns     40 ns     34 ns
Unbounded MPMC timed spin only       63 ns     47 ns     36 ns
Unbounded MPMC wait  spin only       45 ns     39 ns     36 ns
Unbounded MPMC try   may block       62 ns     51 ns     47 ns
Unbounded MPMC timed may block       77 ns     52 ns     46 ns
Unbounded MPMC wait  may block       63 ns     50 ns     46 ns
..............................................................
folly::MPMC  read                   114 ns    103 ns     77 ns
folly::MPMC  tryReadUntil           116 ns    106 ns     85 ns
folly::MPMC  blockingRead            85 ns     79 ns     63 ns
==============================================================
====================== 16 prod   4 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      106 ns     68 ns     33 ns
Unbounded MPMC timed spin only       88 ns     56 ns     36 ns
Unbounded MPMC wait  spin only       46 ns     39 ns     35 ns
Unbounded MPMC try   may block       95 ns     66 ns     47 ns
Unbounded MPMC timed may block       80 ns     57 ns     46 ns
Unbounded MPMC wait  may block       52 ns     48 ns     45 ns
..............................................................
folly::MPMC  read                   121 ns    113 ns    104 ns
folly::MPMC  tryReadUntil           119 ns    110 ns    101 ns
folly::MPMC  blockingRead            65 ns     62 ns     57 ns
==============================================================
====================== 16 prod   8 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      153 ns    109 ns     46 ns
Unbounded MPMC timed spin only      167 ns    110 ns     36 ns
Unbounded MPMC wait  spin only       43 ns     39 ns     36 ns
Unbounded MPMC try   may block      159 ns    125 ns    100 ns
Unbounded MPMC timed may block      127 ns     82 ns     52 ns
Unbounded MPMC wait  may block       51 ns     50 ns     46 ns
..............................................................
folly::MPMC  read                   149 ns    139 ns    129 ns
folly::MPMC  tryReadUntil           141 ns    134 ns    112 ns
folly::MPMC  blockingRead            59 ns     54 ns     49 ns
==============================================================
====================== 16 prod  16 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      193 ns    169 ns    148 ns
Unbounded MPMC timed spin only      221 ns    175 ns    106 ns
Unbounded MPMC wait  spin only       45 ns     41 ns     37 ns
Unbounded MPMC try   may block      204 ns    171 ns    133 ns
Unbounded MPMC timed may block      184 ns    162 ns    104 ns
Unbounded MPMC wait  may block       61 ns     52 ns     49 ns
..............................................................
folly::MPMC  read                   181 ns    164 ns    157 ns
folly::MPMC  tryReadUntil           185 ns    173 ns    157 ns
folly::MPMC  blockingRead            56 ns     50 ns     45 ns
==============================================================
====================== 16 prod  32 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      255 ns    217 ns    181 ns
Unbounded MPMC timed spin only      225 ns    205 ns    182 ns
Unbounded MPMC wait  spin only      115 ns     57 ns     40 ns
Unbounded MPMC try   may block      215 ns    199 ns    184 ns
Unbounded MPMC timed may block      218 ns    196 ns    179 ns
Unbounded MPMC wait  may block       63 ns     54 ns     47 ns
..............................................................
folly::MPMC  read                   260 ns    205 ns    185 ns
folly::MPMC  tryReadUntil           205 ns    200 ns    192 ns
folly::MPMC  blockingRead            53 ns     48 ns     43 ns
==============================================================
====================== 32 prod   2 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only       95 ns     66 ns     45 ns
Unbounded MPMC timed spin only       95 ns     62 ns     45 ns
Unbounded MPMC wait  spin only       56 ns     44 ns     36 ns
Unbounded MPMC try   may block      123 ns     86 ns     50 ns
Unbounded MPMC timed may block      109 ns     73 ns     47 ns
Unbounded MPMC wait  may block       95 ns     58 ns     47 ns
..............................................................
folly::MPMC  read                   445 ns    380 ns    315 ns
folly::MPMC  tryReadUntil           459 ns    341 ns    153 ns
folly::MPMC  blockingRead           351 ns    286 ns    218 ns
==============================================================
====================== 32 prod   4 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      114 ns     92 ns     59 ns
Unbounded MPMC timed spin only      135 ns     99 ns     47 ns
Unbounded MPMC wait  spin only      139 ns     55 ns     38 ns
Unbounded MPMC try   may block      165 ns    113 ns     72 ns
Unbounded MPMC timed may block      119 ns     94 ns     51 ns
Unbounded MPMC wait  may block       61 ns     52 ns     47 ns
..............................................................
folly::MPMC  read                   127 ns    112 ns     93 ns
folly::MPMC  tryReadUntil           116 ns    107 ns     96 ns
folly::MPMC  blockingRead            67 ns     59 ns     51 ns
==============================================================
====================== 32 prod   8 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      226 ns    140 ns     57 ns
Unbounded MPMC timed spin only      176 ns    126 ns     61 ns
Unbounded MPMC wait  spin only       86 ns     50 ns     39 ns
Unbounded MPMC try   may block      170 ns    131 ns     76 ns
Unbounded MPMC timed may block      201 ns    141 ns    110 ns
Unbounded MPMC wait  may block       94 ns     55 ns     47 ns
..............................................................
folly::MPMC  read                   148 ns    131 ns    120 ns
folly::MPMC  tryReadUntil           132 ns    126 ns    121 ns
folly::MPMC  blockingRead            59 ns     54 ns     51 ns
==============================================================
====================== 32 prod  16 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      209 ns    174 ns    146 ns
Unbounded MPMC timed spin only      214 ns    189 ns    154 ns
Unbounded MPMC wait  spin only      138 ns     51 ns     38 ns
Unbounded MPMC try   may block      247 ns    191 ns    144 ns
Unbounded MPMC timed may block      245 ns    180 ns    123 ns
Unbounded MPMC wait  may block       74 ns     51 ns     46 ns
..............................................................
folly::MPMC  read                   164 ns    148 ns    135 ns
folly::MPMC  tryReadUntil           156 ns    149 ns    140 ns
folly::MPMC  blockingRead            55 ns     50 ns     47 ns
==============================================================
====================== 32 prod  32 cons ======================
=== uint32_t =================================================
Unbounded MPMC try   spin only      255 ns    212 ns    179 ns
Unbounded MPMC timed spin only      391 ns    223 ns    147 ns
Unbounded MPMC wait  spin only       78 ns     44 ns     38 ns
Unbounded MPMC try   may block      516 ns    249 ns    195 ns
Unbounded MPMC timed may block      293 ns    210 ns    171 ns
Unbounded MPMC wait  may block       54 ns     51 ns     48 ns
..............................................................
folly::MPMC  read                   195 ns    183 ns    164 ns
folly::MPMC  tryReadUntil           191 ns    175 ns    159 ns
folly::MPMC  blockingRead            49 ns     45 ns     43 ns
==============================================================

$ lscpu
Architecture:        x86_64
CPU op-mode(s):      32-bit, 64-bit
Byte Order:          Little Endian
CPU(s):              32
On-line CPU(s) list: 0-31
Thread(s) per core:  2
Core(s) per socket:  8
Socket(s):           2
NUMA node(s):        2
Vendor ID:           GenuineIntel
CPU family:          6
Model:               45
Model name:          Intel(R) Xeon(R) CPU E5-2660 0 @ 2.20GHz
Stepping:            6
CPU MHz:             2200.000
CPU max MHz:         2200.0000
CPU min MHz:         1200.0000
BogoMIPS:            4399.92
Virtualization:      VT-x
L1d cache:           32K
L1i cache:           32K
L2 cache:            256K
L3 cache:            20480K
NUMA node0 CPU(s):   0-7,16-23
NUMA node1 CPU(s):   8-15,24-31

Flags:               fpu vme de pse tsc msr pae mce cx8 apic sep mtrr
                     pge mca cmov pat pse36 clflush dts acpi mmx fxsr
                     sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp
                     lm constant_tsc arch_perfmon pebs bts rep_good
                     nopl xtopology nonstop_tsc aperfmperf eagerfpu
                     pni pclmulqdq dtes64 monitor ds_cpl vmx smx est
                     tm2 ssse3 cx16 xtpr pdcm pcid dca sse4_1 sse4_2
                     x2apic popcnt tsc_deadline_timer aes xsave avx
                     lahf_lm epb tpr_shadow vnmi flexpriority ept vpid
                     xsaveopt dtherm arat pln pts
 */