From ba008f405a89d07e170d1b4c893246fb25ccba04 Mon Sep 17 00:00:00 2001
From: Mark Harfouche <mark.harfouche@gmail.com>
Date: Sat, 15 Sep 2018 12:08:41 -0400
Subject: BENCH: Make the pad benchmark pagefault in setup

---
 benchmarks/benchmarks/bench_lib.py | 26 +++++++++++++++++++-------
 1 file changed, 19 insertions(+), 7 deletions(-)

(limited to 'benchmarks')

diff --git a/benchmarks/benchmarks/bench_lib.py b/benchmarks/benchmarks/bench_lib.py
index e6c91a27c..05d6a4aae 100644
--- a/benchmarks/benchmarks/bench_lib.py
+++ b/benchmarks/benchmarks/bench_lib.py
@@ -13,16 +13,28 @@ class Pad(Benchmark):
 
     param_names = ["shape", "pad_width", "mode"]
     params = [
-        [(1000,), (10, 100), (10, 10, 10)],
-        [1, 3, (0, 5)],
-        ["constant", "edge", "linear_ramp", "mean", "reflect", "wrap"],
+        [(1000,),
+         (10, 100),
+         (10, 10, 10),
+         # 50 * 512 * 512 = 13 million points = 46 MB. should be a good
+         # out of cache describing a typical usecase
+         (50, 512, 512)],
+        [1,
+         3,
+         (0, 5)],
+        ["constant",
+         "edge", "linear_ramp",
+         # mean/median/minimum/maximum all use the same code path
+         "mean",
+         # reflect/symmetric share alot of the code path
+         "reflect",
+         "wrap"],
     ]
 
     def setup(self, shape, pad_width, mode):
-        # avoid np.zeros or np.empty's lazy allocation.
-        # np.full causes pagefaults to occur during setup
-        # instead of during the benchmark
-        self.array = np.full(shape, 0)
+        # Make sure to fill the array to make the OS page fault
+        # in the setup phase and not the timed phase
+        self.array = np.full(shape, fill_value=1)
 
     def time_pad(self, shape, pad_width, mode):
         np.pad(self.array, pad_width, mode)
-- 
cgit v1.2.1


From 65a099d4f66c82b48372790d91b7738233043e68 Mon Sep 17 00:00:00 2001
From: Lars Grueter <lagru@mailbox.org>
Date: Fri, 23 Nov 2018 16:46:54 +0100
Subject: BENCH: Pin dtype to float64 for np.pad's benchmarks

---
 benchmarks/benchmarks/bench_lib.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

(limited to 'benchmarks')

diff --git a/benchmarks/benchmarks/bench_lib.py b/benchmarks/benchmarks/bench_lib.py
index 05d6a4aae..211055c4c 100644
--- a/benchmarks/benchmarks/bench_lib.py
+++ b/benchmarks/benchmarks/bench_lib.py
@@ -16,8 +16,8 @@ class Pad(Benchmark):
         [(1000,),
          (10, 100),
          (10, 10, 10),
-         # 50 * 512 * 512 = 13 million points = 46 MB. should be a good
-         # out of cache describing a typical usecase
+         # 50 * 512 * 512 * 64 bits = 100 MiB, corresponds to typical use cases
+         # for large arrays which are out of cache
          (50, 512, 512)],
         [1,
          3,
@@ -34,7 +34,7 @@ class Pad(Benchmark):
     def setup(self, shape, pad_width, mode):
         # Make sure to fill the array to make the OS page fault
         # in the setup phase and not the timed phase
-        self.array = np.full(shape, fill_value=1)
+        self.array = np.full(shape, fill_value=1, dtype=np.float64)
 
     def time_pad(self, shape, pad_width, mode):
         np.pad(self.array, pad_width, mode)
-- 
cgit v1.2.1


From 3f67151194e98f0f53d75252819cc0f08b2d9f6a Mon Sep 17 00:00:00 2001
From: Lars Grueter <lagru@mailbox.org>
Date: Thu, 20 Dec 2018 17:28:12 +0100
Subject: Bench: Adjust parameters and explain background

See new class docstring for an explanation of these changes.
---
 benchmarks/benchmarks/bench_lib.py | 50 +++++++++++++++++++++++++-------------
 1 file changed, 33 insertions(+), 17 deletions(-)

(limited to 'benchmarks')

diff --git a/benchmarks/benchmarks/bench_lib.py b/benchmarks/benchmarks/bench_lib.py
index 211055c4c..7a6b3f01d 100644
--- a/benchmarks/benchmarks/bench_lib.py
+++ b/benchmarks/benchmarks/bench_lib.py
@@ -9,26 +9,42 @@ import numpy as np
 
 
 class Pad(Benchmark):
-    """Benchmarks for `numpy.pad`."""
+    """Benchmarks for `numpy.pad`.
+
+    When benchmarking the pad function it is useful to cover scenarios where
+    the ratio between the size of the input array and the output array differs
+    significantly (original area vs. padded area). This allows to evaluate for
+    which scenario a padding algorithm is optimized. Furthermore involving
+    large range of array sizes ensures that the effects of CPU-bound caching is
+    visible.
+
+    The table below shows the sizes of the arrays involved in this benchmark:
+
+    +-----------------+----------+-----------+-----------+-----------------+
+    | shape           | original | padded: 1 | padded: 8 | padded: (0, 32) |
+    +=================+==========+===========+===========+=================+
+    | (2 ** 22,)      | 32 MiB   | 32.0 MiB  | 32.0 MiB  | 32.0 MiB        |
+    +-----------------+----------+-----------+-----------+-----------------+
+    | (1024, 1024)    | 8 MiB    | 8.03 MiB  | 8.25 MiB  | 8.51 MiB        |
+    +-----------------+----------+-----------+-----------+-----------------+
+    | (256, 256, 1)   | 256 KiB  | 786 KiB   | 5.08 MiB  | 11.6 MiB        |
+    +-----------------+----------+-----------+-----------+-----------------+
+    | (4, 4, 4, 4)    | 2 KiB    | 10.1 KiB  | 1.22 MiB  | 12.8 MiB        |
+    +-----------------+----------+-----------+-----------+-----------------+
+    | (1, 1, 1, 1, 1) | 8 B      | 1.90 MiB  | 10.8 MiB  | 299 MiB         |
+    +-----------------+----------+-----------+-----------+-----------------+
+    """
 
     param_names = ["shape", "pad_width", "mode"]
     params = [
-        [(1000,),
-         (10, 100),
-         (10, 10, 10),
-         # 50 * 512 * 512 * 64 bits = 100 MiB, corresponds to typical use cases
-         # for large arrays which are out of cache
-         (50, 512, 512)],
-        [1,
-         3,
-         (0, 5)],
-        ["constant",
-         "edge", "linear_ramp",
-         # mean/median/minimum/maximum all use the same code path
-         "mean",
-         # reflect/symmetric share alot of the code path
-         "reflect",
-         "wrap"],
+        # Shape of the input arrays
+        [(2 ** 22,), (1024, 1024), (256, 128, 1),
+         (4, 4, 4, 4), (1, 1, 1, 1, 1)],
+        # Tested pad widths
+        [1, 8, (0, 32)],
+        # Tested modes: mean, median, minimum & maximum use the same code path
+        #               reflect & symmetric share a lot of their code path
+        ["constant", "edge", "linear_ramp", "mean", "reflect", "wrap"],
     ]
 
     def setup(self, shape, pad_width, mode):
-- 
cgit v1.2.1