self-test disk test enhancements #20590

Merged · 3 commits · Jul 19, 2024
72 changes: 66 additions & 6 deletions src/go/rpk/pkg/cli/cluster/selftest/start.go
@@ -48,8 +48,11 @@ Available tests to run:
* Disk tests:
** Throughput test: 512 KB messages, sequential read/write
*** Uses larger request message sizes and a deeper I/O queue depth to write/read more bytes in a shorter amount of time, at the cost of IOPS/latency.
** Latency test: 4 KB messages, sequential read/write
*** Uses smaller request message sizes and lower levels of parallelism to achieve higher IOPS and lower latency.
** Latency and io depth tests: 4 KB messages, sequential read/write, varying io depth
*** Uses small IO sizes and varying levels of parallelism to determine the relationship between io depth and IOPS
*** Includes one test without using dsync (fdatasync) on each write to establish the cost of dsync
** 16 KB test
*** One high io depth test at 16 KB to reflect performance at Redpanda's default chunk size
* Network tests:
** Throughput test: 8192-bit messages
*** Unique pairs of Redpanda nodes each act as a client and a server.
@@ -123,7 +126,7 @@ func assembleTests(onlyDisk bool, onlyNetwork bool, onlyCloud bool, durationDisk
diskcheck := []any{
// One test weighted for better throughput results
rpadmin.DiskcheckParameters{
Name: "512KB sequential r/w throughput disk test",
Name: "512KB sequential r/w",
DSync: true,
SkipWrite: false,
SkipRead: false,
@@ -133,16 +136,73 @@ func assembleTests(onlyDisk bool, onlyNetwork bool, onlyCloud bool, durationDisk
Parallelism: 4,
Type: rpadmin.DiskcheckTagIdentifier,
},
// .. and another for better latency/iops results
// .. and then a series of 4KB write-only tests at increasing io depth
rpadmin.DiskcheckParameters{
Name: "4KB sequential r/w latency/iops disk test",
Name: "4KB sequential r/w, low io depth",
DSync: true,
SkipWrite: false,
SkipRead: false,
DataSize: 1 * units.GiB,
RequestSize: 4 * units.KiB,
DurationMs: durationDisk,
Parallelism: 2,
Parallelism: 1,
Type: rpadmin.DiskcheckTagIdentifier,
},
rpadmin.DiskcheckParameters{
Name: "4KB sequential write, medium io depth",
DSync: true,
SkipWrite: false,
SkipRead: true,
DataSize: 1 * units.GiB,
RequestSize: 4 * units.KiB,
DurationMs: durationDisk,
Parallelism: 8,
Type: rpadmin.DiskcheckTagIdentifier,
},
rpadmin.DiskcheckParameters{
Name: "4KB sequential write, high io depth",
DSync: true,
SkipWrite: false,
SkipRead: true,
DataSize: 1 * units.GiB,
RequestSize: 4 * units.KiB,
DurationMs: durationDisk,
Parallelism: 64,
Type: rpadmin.DiskcheckTagIdentifier,
},
rpadmin.DiskcheckParameters{
Name: "4KB sequential write, very high io depth",
DSync: true,
SkipWrite: false,
SkipRead: true,
DataSize: 1 * units.GiB,
RequestSize: 4 * units.KiB,
DurationMs: durationDisk,
Parallelism: 256,
Type: rpadmin.DiskcheckTagIdentifier,
},
// ... and a 4KB test as above but with dsync off
rpadmin.DiskcheckParameters{
Name: "4KB sequential write, no dsync",
DSync: false,
SkipWrite: false,
SkipRead: true,
DataSize: 1 * units.GiB,
RequestSize: 4 * units.KiB,
DurationMs: durationDisk,
Parallelism: 64,
Type: rpadmin.DiskcheckTagIdentifier,
},
// ... and a 16KB test as above as another important size for redpanda
rpadmin.DiskcheckParameters{
Name: "16KB sequential r/w, high io depth",
Member:
Did you intentionally not add something like 4k @ 256 iodepth?

Member Author @travisdowns, Jun 28, 2024:
Are you asking more about "why not 4K" or "why not 256 iodepth"?

In any case it was intentional, but I'm open to ideas here. One thing to note is that the parallelism factor here is then multiplied by the shard count, so on modest 8-shard nodes we are already at a very high 512 io depth for parallelism=64, which IME is larger than what you need to get max throughput even on large local SSD configurations (though of course this may not be the case on some other storage configurations, especially high-throughput, longer-latency network-attached storage).

I don't actually like this multiplication because it (a) adds a confounding factor when comparing results against different clusters which may have different shard counts (but at least now we see the effective iodepth in the output) and (b) it means you can't run an iodepth=1 test except on a cluster with 1-shard nodes.

About 4K vs 16K, my goal was to add a 16K test to see the difference between 4K and 16K, i.e., how much performance varies in the range of block sizes Redpanda is already writing with default settings. Then I also wanted to add a "series" of varying iodepth tests, which I sort of arbitrarily chose to be the 16K one. I didn't want to do both, to keep the number of tests down, and I think maybe I favored 16K over 4K in part because 4K already had parallelism=2, and I wanted 1 and didn't want to change the existing 4K test, to keep some continuity with old results.

That said, very open to changing it. What is your view on the ideal series of tests to run?

Member:
> One thing to note is that the parallelism factor here is then multiplied by the shard count

Wait but right now this all happens on shard zero only. Are you saying we still multiply it by the shard count?

> That said, very open to changing it. What is your view on the ideal series of tests to run?

I don't feel strongly. Just really coming from the classic 4k test and I guess it matches the min amount we write.

I guess the 512Kib test is actually the least relevant one for RP as we never write sizes bigger than 16Kib (only when fetching from TS).

Member Author @travisdowns, Jun 29, 2024:
> Wait but right now this all happens on shard zero only. Are you saying we still multiply it by the shard count?

No, I was simply mistaken. I thought this ran on all shards, but as you say it seems to run on only one shard. I was thrown off especially by this comment and also this code and comment. Perhaps vestigial?

So I will adjust the numbers to hit higher io depths, and maybe add 1 more test.

> Just really coming from the classic 4k test and I guess it matches the min amount we write.

I'll change it to 4K.

> I guess the 512Kib test is actually the least relevant one for RP as we never write sizes bigger than 16Kib (only when fetching from TS).

It's definitely the least useful for evaluating RP performance at the default settings. As a test to understand more about the disk, especially disks with characteristics different than the most common ones we run on, I think it's fine because it is a "max throughput" test, and if it gets a much higher number than the other tests with small blocks then we've learned something.

DSync: false,
SkipWrite: false,
SkipRead: false,
DataSize: 1 * units.GiB,
RequestSize: 16 * units.KiB,
DurationMs: durationDisk,
Parallelism: 64,
Type: rpadmin.DiskcheckTagIdentifier,
},
}
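The 4 KB write-only sweep added above repeats the same parameter literal with only the name, SkipRead, and Parallelism fields changing. Purely as an illustration (not part of this PR), the same sweep could be generated in a loop; field names follow the diff, while the exact field types of rpadmin.DiskcheckParameters and of durationDisk are assumptions here:

```go
// Illustrative sketch only: builds the 4KB dsync sweep at io depths 1, 8, 64 and 256,
// mirroring the literals added in assembleTests above. Field types are assumed.
for _, t := range []struct {
	name        string
	parallelism uint
	skipRead    bool
}{
	{"4KB sequential r/w, low io depth", 1, false},
	{"4KB sequential write, medium io depth", 8, true},
	{"4KB sequential write, high io depth", 64, true},
	{"4KB sequential write, very high io depth", 256, true},
} {
	diskcheck = append(diskcheck, rpadmin.DiskcheckParameters{
		Name:        t.name,
		DSync:       true, // the separate "no dsync" variant is kept out of this sweep
		SkipWrite:   false,
		SkipRead:    t.skipRead,
		DataSize:    1 * units.GiB,
		RequestSize: 4 * units.KiB,
		DurationMs:  durationDisk,
		Parallelism: t.parallelism,
		Type:        rpadmin.DiskcheckTagIdentifier,
	})
}
```

The PR keeps the explicit literals instead, which leaves each configuration easy to read at a glance in the diff.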
3 changes: 2 additions & 1 deletion src/v/cluster/self_test/diskcheck.cc
@@ -144,7 +144,8 @@ diskcheck::run_configured_benchmarks(ss::file& file) {
auto write_metrics = co_await do_run_benchmark<read_or_write::write>(file);
auto result = write_metrics.to_st_result();
result.name = _opts.name;
result.info = "write run";
result.info = fmt::format(
"write run (iodepth: {}, dsync: {})", _opts.parallelism, _opts.dsync);
result.test_type = "disk";
if (_cancelled) {
result.warning = "Run was manually cancelled";
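With this change each write-phase report's info string also records the effective io depth and dsync setting, so, for example, the high-io-depth dsync run above would be labelled "write run (iodepth: 64, dsync: true)" rather than the previous bare "write run".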
4 changes: 2 additions & 2 deletions src/v/cluster/self_test_rpc_types.h
@@ -46,7 +46,7 @@ struct diskcheck_opts
: serde::
envelope<diskcheck_opts, serde::version<0>, serde::compat_version<0>> {
/// Descriptive name given to test run
ss::sstring name{"512K sequential r/w disk test"};
ss::sstring name{"unspecified"};
/// Where files this benchmark will read/write to exist
std::filesystem::path dir{config::node().disk_benchmark_path()};
/// Open the file with O_DSYNC flag option
@@ -56,7 +56,7 @@ struct diskcheck_opts
/// Set to true to disable the read portion of the benchmark
bool skip_read{false};
/// Total size of all benchmark files to exist on disk
uint64_t data_size{10ULL << 30}; // 1GiB
uint64_t data_size{10ULL << 30}; // 10GiB
/// Size of individual read and/or write requests
size_t request_size{512 << 10}; // 512KiB
/// Total duration of the benchmark
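For reference on the comment fix above: 10ULL << 30 is 10 × 2^30 bytes, i.e. 10 GiB, so the old "// 1GiB" annotation was incorrect; only the comment changes here and the default data_size value itself stays the same.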
6 changes: 3 additions & 3 deletions tests/rptest/tests/self_test_test.py
@@ -43,7 +43,7 @@ def all_idle():
return not any([x['status'] == 'running'
for x in node_reports]), node_reports

return wait_until_result(all_idle, timeout_sec=30, backoff_sec=1)
return wait_until_result(all_idle, timeout_sec=90, backoff_sec=1)

@cluster(num_nodes=3)
@matrix(remote_read=[True, False], remote_write=[True, False])
@@ -101,9 +101,9 @@ def assert_fail(report, error_msg):
# on specific results, but rather what tests are observed to have run
reports = flat_map(lambda node: node['results'], node_reports)

# Ensure 4 disk tests per node, read/write & latency/throughput
# Ensure 10 disk tests per node (see the RPK code for the full list)
disk_results = [r for r in reports if r['test_type'] == 'disk']
expected_disk_results = num_nodes * 4
expected_disk_results = num_nodes * 10
assert len(
disk_results
) == expected_disk_results, f"Expected {expected_disk_results} disk reports observed {len(disk_results)}"
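Where the new count of 10 comes from, assuming (as before) one report per read or write phase: three of the seven disk configurations in start.go run both phases (512KB, the low-io-depth 4KB test, and the 16KB test) and contribute two reports each, while the four write-only 4KB variants contribute one each, so 3 × 2 + 4 × 1 = 10 reports per node (previously 2 × 2 = 4).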