TST: Add testing unit for fused NPYV intrinsics

author: Sayed Adel <seiko@imavr.com> 2020-09-14 15:52:27 +0200
committer: Sayed Adel <seiko@imavr.com> 2020-10-27 11:46:58 +0000
commit: 92a4693cb0df392003cf99a2f1abe8927cdd58b4 (patch)
tree: 4147d6754326e23c2755cab298ac760b1606afd6
parent: 1779c2a9287d2242226ee6bac575c75684c3d696 (diff)
download: numpy-92a4693cb0df392003cf99a2f1abe8927cdd58b4.tar.gz
2 files changed, 37 insertions, 2 deletions
diff --git a/numpy/core/src/_simd/_simd.dispatch.c.src b/numpy/core/src/_simd/_simd.dispatch.c.src
index 69a9ffd45..506ef93f0 100644
--- a/numpy/core/src/_simd/_simd.dispatch.c.src
+++ b/numpy/core/src/_simd/_simd.dispatch.c.src
@@ -19,6 +19,7 @@
  * #sat_sup   = 1,  1,  1,   1,   0,   0,   0,   0,   0,   0#
  * #mul_sup   = 1,  1,  1,   1,   1,   1,   0,   0,   1,   1#
  * #div_sup   = 0,  0,  0,   0,   0,   0,   0,   0,   1,   1#
+ * #fused_sup = 0,  0,  0,   0,   0,   0,   0,   0,   1,   1#
  * #shl_imm   = 0,  0,  15,  15,  31,  31,  63,  63,  0,   0#
  * #shr_imm   = 0,  0,  16,  16,  32,  32,  64,  64,  0,   0#
  */
@@ -175,9 +176,16 @@ SIMD_IMPL_INTRIN_2(mul_@sfx@, v@sfx@, v@sfx@, v@sfx@)
 SIMD_IMPL_INTRIN_2(div_@sfx@, v@sfx@, v@sfx@, v@sfx@)
 #endif // div_sup
 
+#if @fused_sup@
+/**begin repeat1
+ * #intrin  = muladd, mulsub, nmuladd, nmulsub#
+ */
+SIMD_IMPL_INTRIN_3(@intrin@_@sfx@, v@sfx@, v@sfx@, v@sfx@, v@sfx@)
+/**end repeat1**/
+#endif // fused_sup
+
 #endif // simd_sup
 /**end repeat**/
-
 /***************************
  * Variant
  ***************************/
@@ -194,6 +202,7 @@ static PyMethodDef simd__intrinsics_methods[] = {
  * #sat_sup   = 1,  1,  1,   1,   0,   0,   0,   0,   0,   0#
  * #mul_sup   = 1,  1,  1,   1,   1,   1,   0,   0,   1,   1#
  * #div_sup   = 0,  0,  0,   0,   0,   0,   0,   0,   1,   1#
+ * #fused_sup = 0,  0,  0,   0,   0,   0,   0,   0,   1,   1#
  * #shl_imm   = 0,  0,  15,  15,  31,  31,  63,  63,  0,   0#
  * #shr_imm   = 0,  0,  16,  16,  32,  32,  64,  64,  0,   0#
  */
@@ -286,6 +295,14 @@ SIMD_INTRIN_DEF(mul_@sfx@)
 SIMD_INTRIN_DEF(div_@sfx@)
 #endif // div_sup
 
+#if @fused_sup@
+/**begin repeat1
+ * #intrin  = muladd, mulsub, nmuladd, nmulsub#
+ */
+SIMD_INTRIN_DEF(@intrin@_@sfx@)
+/**end repeat1**/
+#endif // fused_sup
+
 #endif // simd_sup
 /**end repeat**/
 
diff --git a/numpy/core/tests/test_simd.py b/numpy/core/tests/test_simd.py
index 26e78d402..3ca6b068d 100644
--- a/numpy/core/tests/test_simd.py
+++ b/numpy/core/tests/test_simd.py
@@ -131,7 +131,25 @@ class _SIMD_FP(_Test_Utility):
     """
     To test all float vector types at once
     """
-    pass
+    def test_arithmetic_fused(self):
+        vdata_a, vdata_b, vdata_c = [self.load(self._data())]*3
+        vdata_cx2 = self.add(vdata_c, vdata_c)
+        # multiply and add, a*b + c
+        data_fma = self.load([a * b + c for a, b, c in zip(vdata_a, vdata_b, vdata_c)])
+        fma = self.muladd(vdata_a, vdata_b, vdata_c)
+        assert fma == data_fma
+        # multiply and subtract, a*b - c
+        fms = self.mulsub(vdata_a, vdata_b, vdata_c)
+        data_fms = self.sub(data_fma, vdata_cx2)
+        assert fms == data_fms
+        # negate multiply and add, -(a*b) + c
+        nfma = self.nmuladd(vdata_a, vdata_b, vdata_c)
+        data_nfma = self.sub(vdata_cx2, data_fma)
+        assert nfma == data_nfma
+        # negate multiply and subtract, -(a*b) - c
+        nfms = self.nmulsub(vdata_a, vdata_b, vdata_c)
+        data_nfms = self.mul(data_fma, self.setall(-1))
+        assert nfms == data_nfms
 
 class _SIMD_ALL(_Test_Utility):
     """
author	Sayed Adel <seiko@imavr.com>	2020-09-14 15:52:27 +0200
committer	Sayed Adel <seiko@imavr.com>	2020-10-27 11:46:58 +0000
commit	92a4693cb0df392003cf99a2f1abe8927cdd58b4 (patch)
tree	4147d6754326e23c2755cab298ac760b1606afd6
parent	1779c2a9287d2242226ee6bac575c75684c3d696 (diff)
download	numpy-92a4693cb0df392003cf99a2f1abe8927cdd58b4.tar.gz