summaryrefslogtreecommitdiff
path: root/numpy/lib/function_base.py
diff options
context:
space:
mode:
authorCharles Harris <charlesr.harris@gmail.com>2016-03-14 16:17:55 -0600
committerCharles Harris <charlesr.harris@gmail.com>2016-03-14 16:17:55 -0600
commit03e772afe1cb0ee8fe6b60cda6265d8f8697def1 (patch)
tree8b10453a0f69a0ec8ed8f400eaa687de4f5d361a /numpy/lib/function_base.py
parent160fdf3d96fb979c8cfb0fc7d20dbcb48e4825dd (diff)
parent204308463955f6604356887e3043743dc163d391 (diff)
downloadnumpy-03e772afe1cb0ee8fe6b60cda6265d8f8697def1.tar.gz
Merge pull request #7414 from charris/tweak-corrcoef
Tweak corrcoef
Diffstat (limited to 'numpy/lib/function_base.py')
-rw-r--r--numpy/lib/function_base.py30
1 files changed, 25 insertions, 5 deletions
diff --git a/numpy/lib/function_base.py b/numpy/lib/function_base.py
index a2a24618b..c155babef 100644
--- a/numpy/lib/function_base.py
+++ b/numpy/lib/function_base.py
@@ -2461,11 +2461,17 @@ def cov(m, y=None, rowvar=True, bias=False, ddof=None, fweights=None,
# Handles complex arrays too
m = np.asarray(m)
+ if m.ndim > 2:
+ raise ValueError("m has more than 2 dimensions")
+
if y is None:
dtype = np.result_type(m, np.float64)
else:
y = np.asarray(y)
+ if y.ndim > 2:
+ raise ValueError("y has more than 2 dimensions")
dtype = np.result_type(m, y, np.float64)
+
X = array(m, ndmin=2, dtype=dtype)
if rowvar == 0 and X.shape[0] != 1:
X = X.T
@@ -2589,6 +2595,12 @@ def corrcoef(x, y=None, rowvar=1, bias=np._NoValue, ddof=np._NoValue):
Notes
-----
+ Due to floating point rounding the resulting array may not be Hermitian,
+ the diagonal elements may not be 1, and the elements may not satisfy the
+ inequality abs(a) <= 1. The real and imaginary parts are clipped to the
+ interval [-1, 1] in an attempt to improve on that situation but is not
+ much help in the complex case.
+
This function accepts but discards arguments `bias` and `ddof`. This is
for backwards compatibility with previous versions of this function. These
arguments had no effect on the return values of the function and can be
@@ -2602,13 +2614,21 @@ def corrcoef(x, y=None, rowvar=1, bias=np._NoValue, ddof=np._NoValue):
c = cov(x, y, rowvar)
try:
d = diag(c)
- except ValueError: # scalar covariance
+ except ValueError:
+ # scalar covariance
# nan if incorrect value (nan, inf, 0), 1 otherwise
return c / c
- d = sqrt(d)
- # calculate "c / multiply.outer(d, d)" row-wise ... for memory and speed
- for i in range(0, d.size):
- c[i,:] /= (d * d[i])
+ stddev = sqrt(d.real)
+ c /= stddev[:, None]
+ c /= stddev[None, :]
+
+ # Clip real and imaginary parts to [-1, 1]. This does not guarantee
+ # abs(a[i,j]) <= 1 for complex arrays, but is the best we can do without
+ # excessive work.
+ np.clip(c.real, -1, 1, out=c.real)
+ if np.iscomplexobj(c):
+ np.clip(c.imag, -1, 1, out=c.imag)
+
return c