diff options
| author | Amaury Forgeot d'Arc <amauryfa@gmail.com> | 2008-09-11 20:56:13 +0000 | 
|---|---|---|
| committer | Amaury Forgeot d'Arc <amauryfa@gmail.com> | 2008-09-11 20:56:13 +0000 | 
| commit | 24cb382455a0701b33926c134803a39f13e29bd1 (patch) | |
| tree | 9c99aba4406b65ae0fe19bd38dac101ed7e21c30 | |
| parent | d2e09383624944add0e670b857c572129d56988e (diff) | |
| download | cpython-git-24cb382455a0701b33926c134803a39f13e29bd1.tar.gz | |
#3640: Correct a crash in cPickle on 64bit platforms, in the case of deeply nested lists or dicts.
Reviewed by Martin von Loewis.
| -rw-r--r-- | Misc/NEWS | 3 | ||||
| -rw-r--r-- | Misc/find_recursionlimit.py | 19 | ||||
| -rw-r--r-- | Modules/cPickle.c | 181 | 
3 files changed, 139 insertions, 64 deletions
| @@ -75,6 +75,9 @@ C-API  Library  ------- +- Issue #3640: Pickling a list or a dict uses less local variables, to reduce +  stack usage in the case of deeply nested objects. +  - Issue #3629: Fix sre "bytecode" validator for an end case.  - Issue #3811: The Unicode database was updated to 5.1. diff --git a/Misc/find_recursionlimit.py b/Misc/find_recursionlimit.py index e6454c9c30..398abebc16 100644 --- a/Misc/find_recursionlimit.py +++ b/Misc/find_recursionlimit.py @@ -22,6 +22,7 @@ NB: A program that does not use __methods__ can set a higher limit.  """  import sys +import itertools  class RecursiveBlowup1:      def __init__(self): @@ -61,6 +62,23 @@ def test_getitem():  def test_recurse():      return test_recurse() +def test_cpickle(_cache={}): +    try: +        import cPickle +    except ImportError: +        print "cannot import cPickle, skipped!" +        return +    l = None +    for n in itertools.count(): +        try: +            l = _cache[n] +            continue  # Already tried and it works, let's save some time +        except KeyError: +            for i in range(100): +                l = [l] +        cPickle.dumps(l, protocol=-1) +        _cache[n] = l +  def check_limit(n, test_func_name):      sys.setrecursionlimit(n)      if test_func_name.startswith("test_"): @@ -83,5 +101,6 @@ while 1:      check_limit(limit, "test_init")      check_limit(limit, "test_getattr")      check_limit(limit, "test_getitem") +    check_limit(limit, "test_cpickle")      print "Limit of %d is fine" % limit      limit = limit + 100 diff --git a/Modules/cPickle.c b/Modules/cPickle.c index 7f4ad7eb87..95d619dc91 100644 --- a/Modules/cPickle.c +++ b/Modules/cPickle.c @@ -1515,8 +1515,8 @@ save_tuple(Picklerobject *self, PyObject *args)  static int  batch_list(Picklerobject *self, PyObject *iter)  { -	PyObject *obj; -	PyObject *slice[BATCHSIZE]; +	PyObject *obj = NULL; +	PyObject *firstitem = NULL;  	int i, n;  	static char append = APPEND; @@ -1545,45 +1545,69 @@ batch_list(Picklerobject *self, PyObject *iter)  	/* proto > 0:  write in batches of BATCHSIZE. */  	do { -		/* Get next group of (no more than) BATCHSIZE elements. */ -		for (n = 0; n < BATCHSIZE; ++n) { -			obj = PyIter_Next(iter); -			if (obj == NULL) { -				if (PyErr_Occurred()) -					goto BatchFailed; -				break; -			} -			slice[n] = obj; +		/* Get first item */ +		firstitem = PyIter_Next(iter); +		if (firstitem == NULL) { +			if (PyErr_Occurred()) +				goto BatchFailed; + +			/* nothing more to add */ +			break;  		} -		if (n > 1) { -			/* Pump out MARK, slice[0:n], APPENDS. */ -			if (self->write_func(self, &MARKv, 1) < 0) +		/* Try to get a second item */ +		obj = PyIter_Next(iter); +		if (obj == NULL) { +			if (PyErr_Occurred())  				goto BatchFailed; -			for (i = 0; i < n; ++i) { -				if (save(self, slice[i], 0) < 0) -					goto BatchFailed; -			} -			if (self->write_func(self, &appends, 1) < 0) -				goto BatchFailed; -		} -		else if (n == 1) { -			if (save(self, slice[0], 0) < 0) + +			/* Only one item to write */ +			if (save(self, firstitem, 0) < 0)  				goto BatchFailed;  			if (self->write_func(self, &append, 1) < 0)  				goto BatchFailed; +			Py_CLEAR(firstitem); +			break;  		} -		for (i = 0; i < n; ++i) { -			Py_DECREF(slice[i]); +		/* More than one item to write */ + +		/* Pump out MARK, items, APPENDS. */ +		if (self->write_func(self, &MARKv, 1) < 0) +			goto BatchFailed; +		 +		if (save(self, firstitem, 0) < 0) +			goto BatchFailed; +		Py_CLEAR(firstitem); +		n = 1; +		 +		/* Fetch and save up to BATCHSIZE items */ +		while (obj) { +			if (save(self, obj, 0) < 0) +				goto BatchFailed; +			Py_CLEAR(obj); +			n += 1; +			 +			if (n == BATCHSIZE) +				break; + +			obj = PyIter_Next(iter); +			if (obj == NULL) { +				if (PyErr_Occurred()) +					goto BatchFailed; +				break; +			}  		} + +		if (self->write_func(self, &appends, 1) < 0) +			goto BatchFailed; +  	} while (n == BATCHSIZE);  	return 0;  BatchFailed: -	while (--n >= 0) { -		Py_DECREF(slice[n]); -	} +	Py_XDECREF(firstitem); +	Py_XDECREF(obj);  	return -1;  } @@ -1659,8 +1683,8 @@ save_list(Picklerobject *self, PyObject *args)  static int  batch_dict(Picklerobject *self, PyObject *iter)  { -	PyObject *p; -	PyObject *slice[BATCHSIZE]; +	PyObject *p = NULL; +	PyObject *firstitem = NULL;  	int i, n;  	static char setitem = SETITEM; @@ -1696,56 +1720,85 @@ batch_dict(Picklerobject *self, PyObject *iter)  	/* proto > 0:  write in batches of BATCHSIZE. */  	do { -		/* Get next group of (no more than) BATCHSIZE elements. */ -		for (n = 0; n < BATCHSIZE; ++n) { -			p = PyIter_Next(iter); -			if (p == NULL) { -				if (PyErr_Occurred()) -					goto BatchFailed; -				break; -			} -			if (!PyTuple_Check(p) || PyTuple_Size(p) != 2) { -				PyErr_SetString(PyExc_TypeError, "dict items " -					"iterator must return 2-tuples"); +		/* Get first item */ +		firstitem = PyIter_Next(iter); +		if (firstitem == NULL) { +			if (PyErr_Occurred())  				goto BatchFailed; -			} -			slice[n] = p; + +			/* nothing more to add */ +			break; +		} +		if (!PyTuple_Check(firstitem) || PyTuple_Size(firstitem) != 2) { +			PyErr_SetString(PyExc_TypeError, "dict items " +					"iterator must return 2-tuples"); +			goto BatchFailed;  		} -		if (n > 1) { -			/* Pump out MARK, slice[0:n], SETITEMS. */ -			if (self->write_func(self, &MARKv, 1) < 0) +		/* Try to get a second item */ +		p = PyIter_Next(iter); +		if (p == NULL) { +			if (PyErr_Occurred())  				goto BatchFailed; -			for (i = 0; i < n; ++i) { -				p = slice[i]; -				if (save(self, PyTuple_GET_ITEM(p, 0), 0) < 0) -					goto BatchFailed; -				if (save(self, PyTuple_GET_ITEM(p, 1), 0) < 0) -					goto BatchFailed; -			} -			if (self->write_func(self, &setitems, 1) < 0) + +			/* Only one item to write */ +			if (save(self, PyTuple_GET_ITEM(firstitem, 0), 0) < 0)  				goto BatchFailed; +			if (save(self, PyTuple_GET_ITEM(firstitem, 1), 0) < 0) +				goto BatchFailed; +			if (self->write_func(self, &setitem, 1) < 0) +				goto BatchFailed; +			Py_CLEAR(firstitem); +			break;  		} -		else if (n == 1) { -			p = slice[0]; + +		/* More than one item to write */ + +		/* Pump out MARK, items, SETITEMS. */ +		if (self->write_func(self, &MARKv, 1) < 0) +			goto BatchFailed; + +		if (save(self, PyTuple_GET_ITEM(firstitem, 0), 0) < 0) +			goto BatchFailed; +		if (save(self, PyTuple_GET_ITEM(firstitem, 1), 0) < 0) +			goto BatchFailed; +		Py_CLEAR(firstitem); +		n = 1; + +		/* Fetch and save up to BATCHSIZE items */ +		while (p) { +			if (!PyTuple_Check(p) || PyTuple_Size(p) != 2) { +				PyErr_SetString(PyExc_TypeError, "dict items " +					"iterator must return 2-tuples"); +				goto BatchFailed; +			}  			if (save(self, PyTuple_GET_ITEM(p, 0), 0) < 0)  				goto BatchFailed;  			if (save(self, PyTuple_GET_ITEM(p, 1), 0) < 0)  				goto BatchFailed; -			if (self->write_func(self, &setitem, 1) < 0) -				goto BatchFailed; -		} +			Py_CLEAR(p); +			n += 1; + +			if (n == BATCHSIZE) +				break; -		for (i = 0; i < n; ++i) { -			Py_DECREF(slice[i]); +			p = PyIter_Next(iter); +			if (p == NULL) { +				if (PyErr_Occurred()) +					goto BatchFailed; +				break; +			}  		} + +		if (self->write_func(self, &setitems, 1) < 0) +			goto BatchFailed; +  	} while (n == BATCHSIZE);  	return 0;  BatchFailed: -	while (--n >= 0) { -		Py_DECREF(slice[n]); -	} +	Py_XDECREF(firstitem); +	Py_XDECREF(p);  	return -1;  } | 
