MAINT: Remove NotImplemented handling from ufuncs (almost)

This was redundant/broken anyway. See gh-5844 for discussion. See the massive comment added to ufunc_object.c:get_ufunc_arguments for a discussion of the deprecation strategy here -- it turns out that array_richcompare is such a disaster zone that we can't quite wholly eliminate NotImplemented quite yet. But this removes most NotImplementeds, and lays the groundwork for eliminating the rest in a release or two.
author: Nathaniel J. Smith <njs@pobox.com> 2015-05-07 22:57:16 -0700
committer: Charles Harris <charlesr.harris@gmail.com> 2015-06-13 12:36:26 -0600
commit: 6bf0e419dc79ea6815557c57b7e9bb504ba20543 (patch)
tree: 36a55fdd8cbf7e39d2b58e0e0b3b9b009ad090c8 /numpy
parent: a0643f542642537cb4f4b3fa057fbbecaf799b29 (diff)
download: numpy-6bf0e419dc79ea6815557c57b7e9bb504ba20543.tar.gz
5 files changed, 191 insertions, 95 deletions
diff --git a/numpy/core/src/multiarray/arrayobject.c b/numpy/core/src/multiarray/arrayobject.c
index 3e5084fb3..6a22cd141 100644
--- a/numpy/core/src/multiarray/arrayobject.c
+++ b/numpy/core/src/multiarray/arrayobject.c
@@ -1312,6 +1312,15 @@ array_richcompare(PyArrayObject *self, PyObject *other, int cmp_op)
         else {
             return _strings_richcompare(self, array_other, cmp_op, 0);
         }
+        /* If we reach this point, it means that we are not comparing
+         * string-to-string. It's possible that this will still work out,
+         * e.g. if the other array is an object array, then both will be cast
+         * to object or something? I don't know how that works actually, but
+         * it does, b/c this works:
+         *   l = ["a", "b"]
+         *   assert np.array(l, dtype="S1") == np.array(l, dtype="O")
+         * So we fall through and see what happens.
+         */
     }
 
     switch (cmp_op) {
@@ -1360,10 +1369,9 @@ array_richcompare(PyArrayObject *self, PyObject *other, int cmp_op)
              */
             if (array_other == NULL) {
                 PyErr_Clear();
-                if (DEPRECATE_FUTUREWARNING(
+                if (DEPRECATE(
                         "elementwise comparison failed and returning scalar "
-                        "instead; this will raise an error or perform "
-                        "elementwise comparison in the future.") < 0) {
+                        "instead; this will raise an error in the future.") < 0) {
                     return NULL;
                 }
                 Py_INCREF(Py_NotImplemented);
@@ -1445,10 +1453,9 @@ array_richcompare(PyArrayObject *self, PyObject *other, int cmp_op)
             */
             if (array_other == NULL) {
                 PyErr_Clear();
-                if (DEPRECATE_FUTUREWARNING(
+                if (DEPRECATE(
                         "elementwise comparison failed and returning scalar "
-                        "instead; this will raise an error or perform "
-                        "elementwise comparison in the future.") < 0) {
+                        "instead; this will raise an error in the future.") < 0) {
                     return NULL;
                 }
                 Py_INCREF(Py_NotImplemented);
diff --git a/numpy/core/src/umath/ufunc_object.c b/numpy/core/src/umath/ufunc_object.c
index 21e1013d9..e120b5fd5 100644
--- a/numpy/core/src/umath/ufunc_object.c
+++ b/numpy/core/src/umath/ufunc_object.c
@@ -523,38 +523,6 @@ PyUFunc_GetPyValues(char *name, int *bufsize, int *errmask, PyObject **errobj)
     return _extract_pyvals(ref, name, bufsize, errmask, errobj);
 }
 
-#define GETATTR(str, rstr) do {if (strcmp(name, #str) == 0)     \
-        return PyObject_HasAttrString(op, "__" #rstr "__");} while (0);
-
-static int
-_has_reflected_op(PyObject *op, const char *name)
-{
-    GETATTR(add, radd);
-    GETATTR(subtract, rsub);
-    GETATTR(multiply, rmul);
-    GETATTR(divide, rdiv);
-    GETATTR(true_divide, rtruediv);
-    GETATTR(floor_divide, rfloordiv);
-    GETATTR(remainder, rmod);
-    GETATTR(power, rpow);
-    GETATTR(left_shift, rlshift);
-    GETATTR(right_shift, rrshift);
-    GETATTR(bitwise_and, rand);
-    GETATTR(bitwise_xor, rxor);
-    GETATTR(bitwise_or, ror);
-    /* Comparisons */
-    GETATTR(equal, eq);
-    GETATTR(not_equal, ne);
-    GETATTR(greater, lt);
-    GETATTR(less, gt);
-    GETATTR(greater_equal, le);
-    GETATTR(less_equal, ge);
-    return 0;
-}
-
-#undef GETATTR
-
-
 /* Return the position of next non-white-space char in the string */
 static int
 _next_non_white_space(const char* str, int offset)
@@ -896,16 +864,122 @@ get_ufunc_arguments(PyUFuncObject *ufunc,
         }
     }
 
-    /*
-     * Indicate not implemented if there are flexible objects (structured
-     * type or string) but no object types and no registered struct
-     * dtype ufuncs.
-     *
-     * Not sure - adding this increased to 246 errors, 150 failures.
-     */
     if (any_flexible && !any_flexible_userloops && !any_object) {
-        return -2;
-
+        /* Traditionally, we return -2 here (meaning "NotImplemented") anytime
+         * we hit the above condition.
+         *
+         * This condition basically means "we are doomed", b/c the "flexible"
+         * dtypes -- strings and void -- cannot have their own ufunc loops
+         * registered (except via the special "flexible userloops" mechanism),
+         * and they can't be cast to anything except object (and we only cast
+         * to object if any_object is true). So really we should do nothing
+         * here and continue and let the proper error be raised. But, we can't
+         * quite yet, b/c of backcompat.
+         *
+         * Most of the time, this NotImplemented either got returned directly
+         * to the user (who can't do anything useful with it), or got passed
+         * back out of a special function like __mul__. And fortunately, for
+         * almost all special functions, the end result of this was a
+         * TypeError. Which is also what we get if we just continue without
+         * this special case, so this special case is unnecessary.
+         *
+         * The only thing that actually depended on the NotImplemented is
+         * array_richcompare, which did two things with it. First, it needed
+         * to see this NotImplemented in order to implement the special-case
+         * comparisons for
+         *
+         *    string < <= == != >= > string
+         *    void == != void
+         *
+         * Now it checks for those cases first, before trying to call the
+         * ufunc, so that's no problem. What it doesn't handle, though, is
+         * cases like
+         *
+         *    float < string
+         *
+         * or
+         *
+         *    float == void
+         *
+         * For those, it just let the NotImplemented bubble out, and accepted
+         * Python's default handling. And unfortunately, for comparisons,
+         * Python's default is *not* to raise an error. Instead, it returns
+         * something that depends on the operator:
+         *
+         *    ==         return False
+         *    !=         return True
+         *    < <= >= >  Python 2: use "fallback" (= weird and broken) ordering
+         *               Python 3: raise TypeError (hallelujah)
+         *
+         * In most cases this is straightforwardly broken, because comparison
+         * of two arrays should always return an array, and here we end up
+         * returning a scalar. However, there is an exception: if we are
+         * comparing two scalars for equality, then it actually is correct to
+         * return a scalar bool instead of raising an error. If we just
+         * removed this special check entirely, then "np.float64(1) == 'foo'"
+         * would raise an error instead of returning False, which is genuinely
+         * wrong.
+         *
+         * The proper end goal here is:
+         *   1) == and != should be implemented in a proper vectorized way for
+         *      all types. The short-term hack for this is just to add a
+         *      special case to PyUFunc_DefaultLegacyInnerLoopSelector where
+         *      if it can't find a comparison loop for the given types, and
+         *      the ufunc is np.equal or np.not_equal, then it returns a loop
+         *      that just fills the output array with False (resp. True). Then
+         *      array_richcompare could trust that whenever its special cases
+         *      don't apply, simply calling the ufunc will do the right thing,
+         *      even without this special check.
+         *   2) < <= >= > should raise an error if no comparison function can
+         *      be found. array_richcompare already handles all string <>
+         *      string cases, and void dtypes don't have ordering, so again
+         *      this would mean that array_richcompare could simply call the
+         *      ufunc and it would do the right thing (i.e., raise an error),
+         *      again without needing this special check.
+         *
+         * So this means that for the transition period, our goal is:
+         *   == and != on scalars should simply return NotImplemented like
+         *     they always did, since everything ends up working out correctly
+         *     in this case only
+         *   == and != on arrays should issue a FutureWarning and then return
+         *     NotImplemented
+         *   < <= >= > on all flexible dtypes on py2 should raise a
+         *     DeprecationWarning, and then return NotImplemented. On py3 we
+         *     skip the warning, though, b/c it would just be immediately be
+         *     followed by an exception anyway.
+         *
+         * And for all other operations, we let things continue as normal.
+         */
+        /* strcmp() is a hack but I think we can get away with it for this
+         * temporary measure.
+         */
+        if (!strcmp(ufunc_name, "equal")
+            || !strcmp(ufunc_name, "not_equal")) {
+            /* Warn on non-scalar, return NotImplemented regardless */
+            assert(nin == 2);
+            if (PyArray_NDIM(out_op[0]) != 0
+                || PyArray_NDIM(out_op[1]) != 0) {
+                if (DEPRECATE_FUTUREWARNING(
+                        "elementwise comparison failed; returning scalar "
+                        "but in the future will perform elementwise "
+                        "comparison") < 0) {
+                    return -1;
+                }
+            }
+            return -2;
+        }
+        else if (!strcmp(ufunc_name, "less")
+                 || !strcmp(ufunc_name, "less_equal")
+                 || !strcmp(ufunc_name, "greater")
+                 || !strcmp(ufunc_name, "greater_equal")) {
+#if !defined(NPY_PY3K)
+            if (DEPRECATE("unorderable dtypes; returning scalar but in "
+                          "the future this will be an error") < 0) {
+                return -1;
+            }
+#endif
+            return -2;
+        }
     }
 
     /* Get positional output arguments */
@@ -2142,26 +2216,6 @@ PyUFunc_GeneralizedFunction(PyUFuncObject *ufunc,
         goto fail;
     }
 
-    /*
-     * FAIL with NotImplemented if the other object has
-     * the __r<op>__ method and has a higher priority than
-     * the current op (signalling it can handle ndarray's).
-    */
-    if (nin == 2 && nout == 1 && dtypes[1]->type_num == NPY_OBJECT) {
-        PyObject *_obj = PyTuple_GET_ITEM(args, 1);
-        if (!PyArray_CheckExact(_obj)) {
-            double self_prio, other_prio;
-            self_prio = PyArray_GetPriority(PyTuple_GET_ITEM(args, 0),
-                                                        NPY_SCALAR_PRIORITY);
-            other_prio = PyArray_GetPriority(_obj, NPY_SCALAR_PRIORITY);
-            if (self_prio < other_prio &&
-                            _has_reflected_op(_obj, ufunc_name)) {
-                retval = -2;
-                goto fail;
-            }
-        }
-    }
-
 #if NPY_UF_DBG_TRACING
     printf("input types:\n");
     for (i = 0; i < nin; ++i) {
@@ -2521,27 +2575,6 @@ PyUFunc_GenericFunction(PyUFuncObject *ufunc,
         }
     }
 
-    /*
-     * FAIL with NotImplemented if the other object has
-     * the __r<op>__ method and has __array_priority__ as
-     * an attribute (signalling it can handle ndarray's)
-     * and is not already an ndarray or a subtype of the same type.
-    */
-    if (nin == 2 && nout == 1 && dtypes[1]->type_num == NPY_OBJECT) {
-        PyObject *_obj = PyTuple_GET_ITEM(args, 1);
-        if (!PyArray_Check(_obj)) {
-            double self_prio, other_prio;
-            self_prio = PyArray_GetPriority(PyTuple_GET_ITEM(args, 0),
-                                                        NPY_SCALAR_PRIORITY);
-            other_prio = PyArray_GetPriority(_obj, NPY_SCALAR_PRIORITY);
-            if (self_prio < other_prio &&
-                            _has_reflected_op(_obj, ufunc_name)) {
-                retval = -2;
-                goto fail;
-            }
-        }
-    }
-
 #if NPY_UF_DBG_TRACING
     printf("input types:\n");
     for (i = 0; i < nin; ++i) {
@@ -4222,13 +4255,15 @@ ufunc_generic_call(PyUFuncObject *ufunc, PyObject *args, PyObject *kwds)
             return NULL;
         }
         else if (ufunc->nin == 2 && ufunc->nout == 1) {
-            /* To allow the other argument to be given a chance */
+            /* For array_richcompare's benefit -- see the long comment in
+             * get_ufunc_arguments.
+             */
             Py_INCREF(Py_NotImplemented);
             return Py_NotImplemented;
         }
         else {
             PyErr_SetString(PyExc_TypeError,
-                                        "Not implemented for this type");
+                            "XX can't happen, please report a bug XX");
             return NULL;
         }
     }
diff --git a/numpy/core/tests/test_deprecations.py b/numpy/core/tests/test_deprecations.py
index b4889e491..02dafb6de 100644
--- a/numpy/core/tests/test_deprecations.py
+++ b/numpy/core/tests/test_deprecations.py
@@ -5,6 +5,7 @@ to document how deprecations should eventually be turned into errors.
 """
 from __future__ import division, absolute_import, print_function
 
+import sys
 import operator
 import warnings
 
@@ -382,8 +383,7 @@ class TestComparisonDeprecations(_DeprecationTestCase):
     Also test FutureWarning for the None comparison.
     """
 
-    message = "elementwise comparison failed; " \
-              "this will raise an error in the future."
+    message = "elementwise.* comparison failed; .*"
 
     def test_normal_types(self):
         for op in (operator.eq, operator.ne):
@@ -442,6 +442,52 @@ class TestComparisonDeprecations(_DeprecationTestCase):
         # it has to be considered when the deprecations is done.
         assert_(np.equal(np.datetime64('NaT'), None))
 
+    def test_void_dtype_equality_failures(self):
+        class NotArray(object):
+            def __array__(self):
+                raise TypeError
+
+        self.assert_deprecated(lambda: np.arange(2) == NotArray())
+        self.assert_deprecated(lambda: np.arange(2) != NotArray())
+
+        struct1 = np.zeros(2, dtype="i4,i4")
+        struct2 = np.zeros(2, dtype="i4,i4,i4")
+
+        assert_warns(FutureWarning, lambda: struct1 == 1)
+        assert_warns(FutureWarning, lambda: struct1 == struct2)
+        assert_warns(FutureWarning, lambda: struct1 != 1)
+        assert_warns(FutureWarning, lambda: struct1 != struct2)
+
+    def test_array_richcompare_legacy_weirdness(self):
+        # It doesn't really work to use assert_deprecated here, b/c part of
+        # the point of assert_deprecated is to check that when warnings are
+        # set to "error" mode then the error is propagated -- which is good!
+        # But here we are testing a bunch of code that is deprecated *because*
+        # it has the habit of swallowing up errors and converting them into
+        # different warnings. So assert_warns will have to be sufficient.
+        assert_warns(FutureWarning, lambda: np.arange(2) == "a")
+        assert_warns(FutureWarning, lambda: np.arange(2) != "a")
+        # No warning for scalar comparisons
+        with warnings.catch_warnings():
+            warnings.filterwarnings("error")
+            assert_(not (np.array(0) == "a"))
+            assert_(np.array(0) != "a")
+            assert_(not (np.int16(0) == "a"))
+            assert_(np.int16(0) != "a")
+
+        for arg1 in [np.asarray(0), np.int16(0)]:
+            struct = np.zeros(2, dtype="i4,i4")
+            for arg2 in [struct, "a"]:
+                for f in [operator.lt, operator.le, operator.gt, operator.ge]:
+                    if sys.version_info[0] >= 3:
+                        # py3
+                        with warnings.catch_warnings() as l:
+                            warnings.filterwarnings("always")
+                            assert_raises(TypeError, f, arg1, arg2)
+                            assert not l
+                    else:
+                        # py2
+                        assert_warns(DeprecationWarning, f, arg1, arg2)
 
 class TestIdentityComparisonDeprecations(_DeprecationTestCase):
     """This tests the equal and not_equal object ufuncs identity check
diff --git a/numpy/core/tests/test_indexing.py b/numpy/core/tests/test_indexing.py
index 6346d2d40..e55c212b7 100644
--- a/numpy/core/tests/test_indexing.py
+++ b/numpy/core/tests/test_indexing.py
@@ -955,12 +955,16 @@ class TestMultiIndexingAutomated(TestCase):
             # index, when running the file separately.
             warnings.filterwarnings('error', '', DeprecationWarning)
             warnings.filterwarnings('error', '', np.VisibleDeprecationWarning)
+
+            def isskip(idx):
+                return isinstance(idx, str) and idx == "skip"
+
             for simple_pos in [0, 2, 3]:
                 tocheck = [self.fill_indices, self.complex_indices,
                            self.fill_indices, self.fill_indices]
                 tocheck[simple_pos] = self.simple_indices
                 for index in product(*tocheck):
-                    index = tuple(i for i in index if i != 'skip')
+                    index = tuple(i for i in index if not isskip(i))
                     self._check_multi_index(self.a, index)
                     self._check_multi_index(self.b, index)
 
diff --git a/numpy/core/tests/test_regression.py b/numpy/core/tests/test_regression.py
index 34f96298f..3d2ceddc1 100644
--- a/numpy/core/tests/test_regression.py
+++ b/numpy/core/tests/test_regression.py
@@ -128,13 +128,17 @@ class TestRegression(TestCase):
         assert_almost_equal(x**(-1), [1/(1+2j)])
 
     def test_scalar_compare(self,level=rlevel):
-        """Ticket #72"""
+        # Trac Ticket #72
+        # https://github.com/numpy/numpy/issues/565
         a = np.array(['test', 'auto'])
         assert_array_equal(a == 'auto', np.array([False, True]))
         self.assertTrue(a[1] == 'auto')
         self.assertTrue(a[0] != 'auto')
         b = np.linspace(0, 10, 11)
-        self.assertTrue(b != 'auto')
+        # This should return true for now, but will eventually raise an error:
+        with warnings.catch_warnings():
+            warnings.filterwarnings("ignore", category=DeprecationWarning)
+            self.assertTrue(b != 'auto')
         self.assertTrue(b[0] != 'auto')
 
     def test_unicode_swapping(self,level=rlevel):
author	Nathaniel J. Smith <njs@pobox.com>	2015-05-07 22:57:16 -0700
committer	Charles Harris <charlesr.harris@gmail.com>	2015-06-13 12:36:26 -0600
commit	6bf0e419dc79ea6815557c57b7e9bb504ba20543 (patch)
tree	36a55fdd8cbf7e39d2b58e0e0b3b9b009ad090c8 /numpy
parent	a0643f542642537cb4f4b3fa057fbbecaf799b29 (diff)
download	numpy-6bf0e419dc79ea6815557c57b7e9bb504ba20543.tar.gz