add throughput numbers to the random_writes benchmark

Summary: Before adding a random_reads benchmark, this diff enables the random_writes benchmark on Windows and adds throughput numbers. Reviewed By: kmancini Differential Revision: D42461465 fbshipit-source-id: 165de212e061f9e2ad58222178422592f3bc688d
2024-10-04 22:07:44 +03:00 · 2023-01-18 20:46:42 -08:00 · 2023-01-18 20:46:42 -08:00 · 07a1caa93c
commit 07a1caa93c
parent 1c2aaa23c3
1 changed files with 60 additions and 23 deletions
--- a/eden/fs/benchmarks/random_writes.cpp
+++ b/eden/fs/benchmarks/random_writes.cpp
@ -8,19 +8,22 @@
 #include <folly/Exception.h>
 #include <folly/File.h>
 #include <folly/FileUtil.h>
+#include <folly/String.h>
 #include <folly/logging/xlog.h>
 #include <folly/portability/GFlags.h>
+#include <algorithm>
 #include <random>
 #include "eden/common/utils/benchharness/Bench.h"

 namespace {
 constexpr size_t kPageSize = 4096;
+constexpr size_t kDefaultFileSize = 16 * 1024 * 1024;

 DEFINE_string(
    filename,
    "random_writes.tmp",
    "Path to which writes should be issued");
-DEFINE_uint64(filesize, kPageSize * 4096, "File size in bytes");
+DEFINE_uint64(filesize, kDefaultFileSize, "File size in bytes");

 struct TemporaryFile {
  TemporaryFile()
@ -32,7 +35,15 @@ struct TemporaryFile {
  }

  ~TemporaryFile() {
-    folly::checkUnixError(::unlink(FLAGS_filename.c_str()));
+    file.close();
+    if (-1 == unlink(FLAGS_filename.c_str())) {
+      int err = errno;
+      fmt::print(
+          stderr,
+          "error unlinking {}: {}",
+          FLAGS_filename,
+          folly::errnoStr(err));
+    }
  }

  folly::File file;
@ -43,36 +54,63 @@ int getTemporaryFD() {
  return tf.file.fd();
 }

+using random_bytes_engine = std::independent_bits_engine<
+    std::default_random_engine,
+    CHAR_BIT,
+    unsigned short>;
+
 void random_writes(benchmark::State& state) {
  int fd = getTemporaryFD();
  off_t pageCount = FLAGS_filesize / kPageSize;

-  char pagebuf[kPageSize];
-
-  {
-    folly::File urandom{"/dev/urandom", O_RDONLY | O_CLOEXEC};
-    folly::checkUnixError(
-        folly::readFull(urandom.fd(), pagebuf, sizeof(pagebuf)),
-        "read /dev/urandom");
-  }
+  uint8_t pagebuf[kPageSize];
+  std::generate(std::begin(pagebuf), std::end(pagebuf), random_bytes_engine{});

  std::default_random_engine gen{std::random_device{}()};
-  std::uniform_int_distribution<off_t> rng{0, pageCount - 1};

  // std::uniform_int_distribution has as much userspace CPU cost as
  // __libc_pwrite64 so pregenerate some offsets.
-  off_t offsets[16 * 1024];
-  std::generate(std::begin(offsets), std::end(offsets), [&] {
-    return rng(gen) * kPageSize;
+  std::vector<off_t> offsets(pageCount);
+  std::generate(offsets.begin(), offsets.end(), [offset = 0ull]() mutable {
+    return (offset++) * kPageSize;
  });
+  std::shuffle(offsets.begin(), offsets.end(), gen);

+  size_t total_written = 0;
+  size_t total_pages = 0;
  size_t offset_index = 0;
  for (auto _ : state) {
-    off_t offset = offsets[offset_index++ % std::size(offsets)];
-    folly::checkUnixError(pwrite(fd, pagebuf, kPageSize, offset));
+    off_t offset = offsets[offset_index];
+    if (offset_index++ == offsets.size()) {
+      // Redoing the offsets is okay
+      total_pages += offsets.size();
+      offset_index = 0;
+    }
+    int result = pwrite(fd, pagebuf, kPageSize, offset);
+    folly::checkUnixError(result);
+    if (result != kPageSize) {
+      fmt::print(stderr, "write was not complete: {} != {}", result, kPageSize);
+    }
+    total_written += result;
  }
+  total_pages += offset_index;
+
+  state.SetItemsProcessed(total_pages);
+  state.SetBytesProcessed(total_written);
 }

+BENCHMARK(random_writes)
+    // By default, google benchmark shows throughput numbers in bytes per CPU
+    // second. That's not useful, so tell it we care about wall clock time.
+    ->UseRealTime()
+    ->Threads(1)
+    ->Threads(2)
+    ->Threads(4)
+    ->Threads(8)
+    ->Threads(16);
+
+#ifdef __GLIBC__
+
 void random_writes_no_cancellation(benchmark::State& state) {
  int oldstate;
  XCHECK_EQ(0, pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, &oldstate));
@ -89,19 +127,18 @@ void random_writes_no_cancellation(benchmark::State& state) {
  random_writes(state);
 }

-BENCHMARK(random_writes)
+BENCHMARK(random_writes_no_cancellation)
+    // By default, google benchmark shows throughput numbers in bytes per CPU
+    // second. That's not useful, so tell it we care about wall clock time.
+    ->UseRealTime()
    ->Threads(1)
    ->Threads(2)
    ->Threads(4)
    ->Threads(8)
    ->Threads(16);

-BENCHMARK(random_writes_no_cancellation)
-    ->Threads(1)
-    ->Threads(2)
-    ->Threads(4)
-    ->Threads(8)
-    ->Threads(16);
+#endif
+
 } // namespace

 EDEN_BENCHMARK_MAIN();