Fixed so swapped record arrays get converted properly.

author: Travis Oliphant <oliphant@enthought.com> 2005-12-13 06:54:34 +0000
committer: Travis Oliphant <oliphant@enthought.com> 2005-12-13 06:54:34 +0000
commit: a20e397e881f3b6c60d00a2195f79b87642f0cb7 (patch)
tree: e278f2bd60cd951df7537ac2ee3871504b7a2319
parent: f0995b54db038fa8e1ecfecf51c2519e48e10043 (diff)
download: numpy-a20e397e881f3b6c60d00a2195f79b87642f0cb7.tar.gz
4 files changed, 173 insertions, 21 deletions
diff --git a/scipy/base/chararray.py b/scipy/base/chararray.py
index 3133de07b..0bcc07b54 100644
--- a/scipy/base/chararray.py
+++ b/scipy/base/chararray.py
@@ -63,7 +63,7 @@ class chararray(ndarray):
         b = broadcast(self, other)
         arr = b.iters[1].base
         outitem = self.itemsize + arr.itemsize
-        result = ndchararray(b.shape, outitem, self.dtype is unicode_)
+        result = chararray(b.shape, outitem, self.dtype is unicode_)
         res = result.flat
         for k, val in enumerate(b):
             res[k] = (val[0] + val[1])
@@ -73,7 +73,7 @@ class chararray(ndarray):
         b = broadcast(other, self)
         outitem = b.iters[0].base.itemsize + \
                   b.iters[1].base.itemsize
-        result = ndchararray(b.shape, outitem, self.dtype is unicode_)        
+        result = chararray(b.shape, outitem, self.dtype is unicode_)        
         res = result.flat
         for k, val in enumerate(b):
             res[k] = (val[0] + val[1])
@@ -85,7 +85,7 @@ class chararray(ndarray):
         if not issubclass(arr.dtype, integer):
             raise ValueError, "Can only multiply by integers"
         outitem = b.iters[0].base.itemsize * arr.max()
-        result = ndchararray(b.shape, outitem, self.dtype is unicode_)
+        result = chararray(b.shape, outitem, self.dtype is unicode_)
         res = result.flat
         for k, val in enumerate(b):
             res[k] = val[0]*val[1]
@@ -97,7 +97,7 @@ class chararray(ndarray):
         if not issubclass(arr.dtype, integer):
             raise ValueError, "Can only multiply by integers"
         outitem = b.iters[0].base.itemsize * arr.max()
-        result = ndchararray(b.shape, outitem, self.dtype is unicode_)        
+        result = chararray(b.shape, outitem, self.dtype is unicode_)        
         res = result.flat
         for k, val in enumerate(b):
             res[k] = val[0]*val[1]
@@ -111,7 +111,7 @@ class chararray(ndarray):
             newval = val[0] % val[1]
             maxsize = max(len(newval), maxsize)
             res[k] = newval
-        newarr = ndchararray(b.shape, maxsize, self.dtype is unicode_)
+        newarr = chararray(b.shape, maxsize, self.dtype is unicode_)
         nearr[:] = res
         return newarr
     
@@ -130,7 +130,7 @@ class chararray(ndarray):
             newitem = getattr(val[0],name)(*newval)
             maxsize = max(len(newitem), maxsize)
             res[k] = newitem
-        newarr = ndchararray(myiter.shape, maxsize, self.dtype is unicode_)
+        newarr = chararray(myiter.shape, maxsize, self.dtype is unicode_)
 	print res, maxsize
         newarr[:] = res
         return newarr
@@ -284,7 +284,7 @@ class chararray(ndarray):
     
 def array(obj, itemlen=7, copy=True, unicode=False, fortran=False):
         
-    if isinstance(obj, ndchararray):
+    if isinstance(obj, chararray):
         if copy or (itemlen != obj.itemlen) \
            or (not unicode and obj.dtype == unicode_) \
            or (unicode and obj.dtype == string):
@@ -308,7 +308,7 @@ def array(obj, itemlen=7, copy=True, unicode=False, fortran=False):
         if copy and not copied:
             obj = obj.copy()
 
-        return ndarray.__new__(ndchararray, obj.shape, (dtype, itemlen),
+        return ndarray.__new__(chararray, obj.shape, (dtype, itemlen),
                                buffer=obj, offset=0, swap=obj.flags.swapped,
                                fortran=obj.flags['FNC'])    
 
diff --git a/scipy/base/records.py b/scipy/base/records.py
index 0b2a6be6a..ec259aad4 100644
--- a/scipy/base/records.py
+++ b/scipy/base/records.py
@@ -4,7 +4,10 @@ import numeric as sb
 import numerictypes as nt
 import sys
 import types
-import re
+import re, stat, os
+
+_sysbyte = sys.byteorder
+_byteorders = ['big','little']
 
 # formats regular expression
 # allows multidimension spec with a tuple syntax in front 
@@ -253,7 +256,8 @@ class record(nt.void):
 
 class recarray(sb.ndarray):
     def __new__(subtype, shape, formats, names=None, titles=None,
-                buf=None, offset=0, strides=None, swap=0, aligned=0):
+                buf=None, offset=0, strides=None, byteorder=_sysbyte,
+                aligned=0):
 
         if isinstance(formats, sb.dtypedescr):
             descr = formats
@@ -267,10 +271,11 @@ class recarray(sb.ndarray):
                     raise ValueError, "Can only deal with alignment"\
                           "for list and dictionary type-descriptors."
             descr = sb.dtypedescr(formats, aligned)
-        
+
         if buf is None:
             self = sb.ndarray.__new__(subtype, shape, (record, descr))
         else:
+            swap = ((byteorder != _sysbyte) and (byteorder in _byteorders))
             self = sb.ndarray.__new__(subtype, shape, (record, descr),
                                       buffer=buf, swap=swap)
         return self
@@ -295,7 +300,7 @@ class recarray(sb.ndarray):
 
 
 def fromarrays(arrayList, formats=None, names=None, titles=None, shape=None,
-               swap=0, aligned=0):
+               aligned=0):
     """ create a record array from a (flat) list of arrays
 
     >>> x1=array([1,2,3,4])
@@ -338,7 +343,7 @@ def fromarrays(arrayList, formats=None, names=None, titles=None, shape=None,
 
     parsed = format_parser(formats, names, titles, aligned)
     _names = parsed._names
-    _array = recarray(shape, parsed._descr, swap=swap)
+    _array = recarray(shape, parsed._descr)
     
     # populate the record array (makes a copy)
     for i in range(len(arrayList)):
@@ -346,8 +351,9 @@ def fromarrays(arrayList, formats=None, names=None, titles=None, shape=None,
 
     return _array
 
+# shape must be 1-d 
 def fromrecords(recList, formats=None, names=None, titles=None, shape=None,
-                swap=0, aligned=0):
+                aligned=0):
     """ create a Record Array from a list of records in text form
 
         The data in the same field can be heterogeneous, they will be promoted
@@ -376,25 +382,147 @@ def fromrecords(recList, formats=None, names=None, titles=None, shape=None,
     if (shape is None or shape == 0):
         shape = len(recList)
 
-    if isinstance(shape, int):
+    if isinstance(shape, (int, long)):
         shape = (shape,)
 
+    if len(shape > 1):
+        raise ValueError, "Can only deal with 1-d list of records"
+
     nfields = len(recList[0])
     if formats is None:  # slower
         obj = sb.array(recList,dtype=object)
         arrlist = [sb.array(obj[:,i].tolist()) for i in xrange(nfields)]
         return fromarrays(arrlist, formats=formats, shape=shape, names=names,
-                          titles=titles, swap=swap, aligned=aligned)
+                          titles=titles, aligned=aligned)
     
     parsed = format_parser(formats, names, titles, aligned)
     _names = parsed._names
-    _array = recarray(shape, parsed._descr, swap=swap)
-
+    _array = recarray(shape, parsed._descr)
     farr = _array.flat
-
+    
     for k in xrange(_array.size):
         for j in xrange(nfields):
             farr[k][_names[j]] = recList[k][j]
 
     return _array
 
+def fromstring(datastring, formats, shape=None, names=None, titles=None,
+               byteorder=_sysbyte, aligned=0, offset=0):
+    """ create a (read-only) record array from binary data contained in
+    a string"""
+
+    formats = format_parser(formats, names, titles, aligned)
+    itemsize = parsed._descr.itemsize
+    if (shape is None or shape == 0 or shape == -1):
+        shape = (len(datastring)-offset) / itemsize
+        
+    _array = recarray(shape, parsed._descr, shape=shape, names=names,
+                      titles=titles, buf=datastring, offset=offset,
+                      byteorder=byteorder)
+    return _array
+
+def fromfile(fd, formats, shape=None, names=None, titles=None,
+             byteorder=_sysbyte, aligned=0, offset=0):
+    """Create an array from binary file data
+
+    If file is a string then that file is opened, else it is assumed
+    to be a file object. No options at the moment, all file positioning
+    must be done prior to this function call with a file object
+
+    >>> import testdata, sys
+    >>> fd=open(testdata.filename)
+    >>> fd.seek(2880*2)
+    >>> r=fromfile(fd, formats='f8,i4,a5', shape=3, byteorder='big')
+    >>> print r[0]
+    (5.1000000000000005, 61, 'abcde')
+    >>> r._shape
+    (3,)
+    """
+
+    if (shape is None or shape == 0):
+        shape = (-1,)
+    elif isinstance(shape, (int, long)):
+        shape = (shape,)
+
+    name = 0
+    if isinstance(fd, str):
+        name = 1
+        fd = open(fd, 'rb')
+    if (offset > 0):
+        fd.seek(offset, 1)
+    try:
+        size = os.fstat(fd.fileno())[stat.ST_SIZE] - fd.tell()
+    except:
+        size = os.path.getsize(fd.name) - fd.tell()
+
+    parsed = format_parser(formats, names, titles, aligned)
+    itemsize = parsed._descr.itemsize
+
+    shapeprod = sb.array(shape).prod()
+    shapesize = shapeprod*itemsize
+    if shapesize < 0:
+        shape = list(shape)
+        shape[ shape.index(-1) ] = size / -shapesize
+        shape = tuple(shape)
+        shapeprod = sb.array(shape).prod()
+        
+    nbytes = shapeprod*itemsize
+
+    if nbytes > size:
+        raise ValueError(
+                "Not enough bytes left in file for specified shape and type")
+
+    # create the array
+    _array = recarray(shape, parsed._descr)
+    nbytesread = fd.readinto(_array.data)
+    if nbytesread != nbytes:
+        raise IOError("Didn't read as many bytes as expected")
+    if name:
+        fd.close()
+
+    # update swap flag if byteorder does not match
+    if ((byteorder != _sysbyte) and (byteorder in _byteorders)):
+        _array.flags.swapped=True
+        
+    return _array
+
+
+def array(obj, formats=None, names=None, titles=None, shape=None,
+          byteorder=_sysbyte, aligned=0, offset=0, strides=None):
+    
+    if isinstance(obj, (type(None), str, file)) and (formats is None):
+        raise ValueError("Must define formats if object is "\
+                         "None, string, or a file pointer")
+
+    elif obj is None:
+        if shape is None:
+            raise ValueError("Must define a shape if obj is None")
+        return recarray(shape, formats, names=names, titles=titles,
+                        buf=obj, offset=offset, strides=strides,
+                        byteorder=byteorder, aligned=aligned)
+    elif isinstance(obj, str):
+        return fromstring(obj, formats, names=names, titles=titles,
+                          shape=shape, byteorder=byteorder, aligned=aligned,
+                          offset=offset)
+    elif isinstance(obj, (list, tuple)):
+        if isinstance(obj[0], sb.ndarray):
+            return fromarrays(obj, formats=formats, names=names, titles=titles,
+                              shape=shape, aligned=aligned)
+        else:
+            return fromrecords(obj, formats=formats, names=names, titles=titles,
+                               shape=shape, aligned=aligned)
+    elif isinstance(obj, recarray):
+        new = obj.copy()
+        parsed = format_parser(formats, names, titles, aligned)
+        new.dtypedescr = parsed._descr
+        return new
+    elif isinstance(obj, file):
+        return fromfile(obj, formats=formats, names=names, titles=titles,
+                        shape=shape, byteorder=byteorder, aligned=aligned,
+                        offset=offset)
+    else:
+        raise ValueError("Unknown input type")
+    
+    
+                
+        
diff --git a/scipy/base/src/scalartypes.inc.src b/scipy/base/src/scalartypes.inc.src
index 5dfa914b6..b095a859f 100644
--- a/scipy/base/src/scalartypes.inc.src
+++ b/scipy/base/src/scalartypes.inc.src
@@ -1070,7 +1070,7 @@ gentype_byteswap(PyObject *self, PyObject *args)
 
 /**begin repeat
 
-#name=getfield, take, put, putmask, repeat, tofile, mean, trace, diagonal, clip, std, var, sum, cumsum, prod, cumprod, compress#
+#name=take, put, putmask, repeat, tofile, mean, trace, diagonal, clip, std, var, sum, cumsum, prod, cumprod, compress#
 */
 
 static PyObject *
@@ -1081,6 +1081,30 @@ gentype_@name@(PyObject *self, PyObject *args, PyObject *kwds)
 /**end repeat**/
 
 static PyObject *
+gentype_getfield(PyObject *self, PyObject *args, PyObject *kwds)
+{
+	PyObject *ret;
+
+	ret = gentype_generic_method(self, args, kwds, "getfield");
+	if (!ret) return ret;
+	if (PyArray_IsScalar(self, Void) && \
+	    PyArray_IsScalar(ret, Generic) &&	\
+	    (!PyArray_IsScalar(ret, Void))) {
+		PyArray_Descr *descr;
+		if (!((((PyVoidScalarObject *)self)->flags &	\
+		       NOTSWAPPED) == NOTSWAPPED)) {
+			descr = PyArray_DescrFromScalar(ret);
+			if (descr->byteorder != '|') {
+				descr->f->copyswap(_SOFFSET_(ret, 
+							     descr->type_num),
+						   NULL, 1, descr->elsize);
+			}
+		}
+	}
+	return ret;
+}
+
+static PyObject *
 gentype_setfield(PyObject *self, PyObject *args, PyObject *kwds)
 {
 	PyArray_Descr *typecode;
diff --git a/scipy/core_version.py b/scipy/core_version.py
index 3708e1368..d59d24b4e 100644
--- a/scipy/core_version.py
+++ b/scipy/core_version.py
@@ -1,4 +1,4 @@
-version='0.8.3'
+version='0.8.4'
 
 import os
 svn_version_file = os.path.join(os.path.dirname(__file__),
author	Travis Oliphant <oliphant@enthought.com>	2005-12-13 06:54:34 +0000
committer	Travis Oliphant <oliphant@enthought.com>	2005-12-13 06:54:34 +0000
commit	a20e397e881f3b6c60d00a2195f79b87642f0cb7 (patch)
tree	e278f2bd60cd951df7537ac2ee3871504b7a2319
parent	f0995b54db038fa8e1ecfecf51c2519e48e10043 (diff)
download	numpy-a20e397e881f3b6c60d00a2195f79b87642f0cb7.tar.gz