mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 10:44:55 +00:00 
			
		
		
		
	 dd226eabe9
			
		
	
	
		dd226eabe9
		
	
	
	
	
		
			
			svn+ssh://pythondev@svn.python.org/python/trunk ........ r72597 | r.david.murray | 2009-05-12 20:30:29 -0400 (Tue, 12 May 2009) | 2 lines Issue 5994: add docstrings to marshal. ........
		
			
				
	
	
		
			1381 lines
		
	
	
	
		
			31 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			1381 lines
		
	
	
	
		
			31 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| 
 | ||
| /* Write Python objects to files and read them back.
 | ||
|    This is intended for writing and reading compiled Python code only;
 | ||
|    a true persistent storage facility would be much harder, since
 | ||
|    it would have to take circular links and sharing into account. */
 | ||
| 
 | ||
| #define PY_SSIZE_T_CLEAN
 | ||
| 
 | ||
| #include "Python.h"
 | ||
| #include "longintrepr.h"
 | ||
| #include "code.h"
 | ||
| #include "marshal.h"
 | ||
| 
 | ||
| #define ABS(x) ((x) < 0 ? -(x) : (x))
 | ||
| 
 | ||
| /* High water mark to determine when the marshalled object is dangerously deep
 | ||
|  * and risks coring the interpreter.  When the object stack gets this deep,
 | ||
|  * raise an exception instead of continuing.
 | ||
|  * On Windows debug builds, reduce this value.
 | ||
|  */
 | ||
| #if defined(MS_WINDOWS) && defined(_DEBUG)
 | ||
| #define MAX_MARSHAL_STACK_DEPTH 1500
 | ||
| #else
 | ||
| #define MAX_MARSHAL_STACK_DEPTH 2000
 | ||
| #endif
 | ||
| 
 | ||
| #define TYPE_NULL		'0'
 | ||
| #define TYPE_NONE		'N'
 | ||
| #define TYPE_FALSE		'F'
 | ||
| #define TYPE_TRUE		'T'
 | ||
| #define TYPE_STOPITER		'S'
 | ||
| #define TYPE_ELLIPSIS   	'.'
 | ||
| #define TYPE_INT		'i'
 | ||
| #define TYPE_INT64		'I'
 | ||
| #define TYPE_FLOAT		'f'
 | ||
| #define TYPE_BINARY_FLOAT	'g'
 | ||
| #define TYPE_COMPLEX		'x'
 | ||
| #define TYPE_BINARY_COMPLEX	'y'
 | ||
| #define TYPE_LONG		'l'
 | ||
| #define TYPE_STRING		's'
 | ||
| #define TYPE_TUPLE		'('
 | ||
| #define TYPE_LIST		'['
 | ||
| #define TYPE_DICT		'{'
 | ||
| #define TYPE_CODE		'c'
 | ||
| #define TYPE_UNICODE		'u'
 | ||
| #define TYPE_UNKNOWN		'?'
 | ||
| #define TYPE_SET		'<'
 | ||
| #define TYPE_FROZENSET  	'>'
 | ||
| 
 | ||
| #define WFERR_OK 0
 | ||
| #define WFERR_UNMARSHALLABLE 1
 | ||
| #define WFERR_NESTEDTOODEEP 2
 | ||
| #define WFERR_NOMEMORY 3
 | ||
| 
 | ||
| typedef struct {
 | ||
| 	FILE *fp;
 | ||
| 	int error;  /* see WFERR_* values */
 | ||
| 	int depth;
 | ||
| 	/* If fp == NULL, the following are valid: */
 | ||
| 	PyObject *str;
 | ||
| 	char *ptr;
 | ||
| 	char *end;
 | ||
| 	PyObject *strings; /* dict on marshal, list on unmarshal */
 | ||
| 	int version;
 | ||
| } WFILE;
 | ||
| 
 | ||
| #define w_byte(c, p) if (((p)->fp)) putc((c), (p)->fp); \
 | ||
| 		      else if ((p)->ptr != (p)->end) *(p)->ptr++ = (c); \
 | ||
| 			   else w_more(c, p)
 | ||
| 
 | ||
| static void
 | ||
| w_more(int c, WFILE *p)
 | ||
| {
 | ||
| 	Py_ssize_t size, newsize;
 | ||
| 	if (p->str == NULL)
 | ||
| 		return; /* An error already occurred */
 | ||
| 	size = PyBytes_Size(p->str);
 | ||
| 	newsize = size + size + 1024;
 | ||
| 	if (newsize > 32*1024*1024) {
 | ||
| 		newsize = size + (size >> 3);	/* 12.5% overallocation */
 | ||
| 	}
 | ||
| 	if (_PyBytes_Resize(&p->str, newsize) != 0) {
 | ||
| 		p->ptr = p->end = NULL;
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		p->ptr = PyBytes_AS_STRING((PyBytesObject *)p->str) + size;
 | ||
| 		p->end =
 | ||
| 			PyBytes_AS_STRING((PyBytesObject *)p->str) + newsize;
 | ||
| 		*p->ptr++ = Py_SAFE_DOWNCAST(c, int, char);
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| static void
 | ||
| w_string(char *s, int n, WFILE *p)
 | ||
| {
 | ||
| 	if (p->fp != NULL) {
 | ||
| 		fwrite(s, 1, n, p->fp);
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		while (--n >= 0) {
 | ||
| 			w_byte(*s, p);
 | ||
| 			s++;
 | ||
| 		}
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| static void
 | ||
| w_short(int x, WFILE *p)
 | ||
| {
 | ||
| 	w_byte((char)( x      & 0xff), p);
 | ||
| 	w_byte((char)((x>> 8) & 0xff), p);
 | ||
| }
 | ||
| 
 | ||
| static void
 | ||
| w_long(long x, WFILE *p)
 | ||
| {
 | ||
| 	w_byte((char)( x      & 0xff), p);
 | ||
| 	w_byte((char)((x>> 8) & 0xff), p);
 | ||
| 	w_byte((char)((x>>16) & 0xff), p);
 | ||
| 	w_byte((char)((x>>24) & 0xff), p);
 | ||
| }
 | ||
| 
 | ||
| #if SIZEOF_LONG > 4
 | ||
| static void
 | ||
| w_long64(long x, WFILE *p)
 | ||
| {
 | ||
| 	w_long(x, p);
 | ||
| 	w_long(x>>32, p);
 | ||
| }
 | ||
| #endif
 | ||
| 
 | ||
| /* We assume that Python longs are stored internally in base some power of
 | ||
|    2**15; for the sake of portability we'll always read and write them in base
 | ||
|    exactly 2**15. */
 | ||
| 
 | ||
| #define PyLong_MARSHAL_SHIFT 15
 | ||
| #define PyLong_MARSHAL_BASE ((short)1 << PyLong_MARSHAL_SHIFT)
 | ||
| #define PyLong_MARSHAL_MASK (PyLong_MARSHAL_BASE - 1)
 | ||
| #if PyLong_SHIFT % PyLong_MARSHAL_SHIFT != 0
 | ||
| #error "PyLong_SHIFT must be a multiple of PyLong_MARSHAL_SHIFT"
 | ||
| #endif
 | ||
| #define PyLong_MARSHAL_RATIO (PyLong_SHIFT / PyLong_MARSHAL_SHIFT)
 | ||
| 
 | ||
| static void
 | ||
| w_PyLong(const PyLongObject *ob, WFILE *p)
 | ||
| {
 | ||
| 	Py_ssize_t i, j, n, l;
 | ||
| 	digit d;
 | ||
| 
 | ||
| 	w_byte(TYPE_LONG, p);
 | ||
| 	if (Py_SIZE(ob) == 0) {
 | ||
| 		w_long((long)0, p);
 | ||
| 		return;
 | ||
| 	}
 | ||
| 
 | ||
| 	/* set l to number of base PyLong_MARSHAL_BASE digits */
 | ||
| 	n = ABS(Py_SIZE(ob));
 | ||
| 	l = (n-1) * PyLong_MARSHAL_RATIO;
 | ||
| 	d = ob->ob_digit[n-1];
 | ||
| 	assert(d != 0); /* a PyLong is always normalized */
 | ||
| 	do {
 | ||
| 		d >>= PyLong_MARSHAL_SHIFT;
 | ||
| 		l++;
 | ||
| 	} while (d != 0);
 | ||
| 	w_long((long)(Py_SIZE(ob) > 0 ? l : -l), p);
 | ||
| 
 | ||
| 	for (i=0; i < n-1; i++) {
 | ||
| 		d = ob->ob_digit[i];
 | ||
| 		for (j=0; j < PyLong_MARSHAL_RATIO; j++) {
 | ||
| 			w_short(d & PyLong_MARSHAL_MASK, p);
 | ||
| 			d >>= PyLong_MARSHAL_SHIFT;
 | ||
| 		}
 | ||
| 		assert (d == 0);
 | ||
| 	}
 | ||
| 	d = ob->ob_digit[n-1];
 | ||
| 	do {
 | ||
| 		w_short(d & PyLong_MARSHAL_MASK, p);
 | ||
| 		d >>= PyLong_MARSHAL_SHIFT;
 | ||
| 	} while (d != 0);
 | ||
| }
 | ||
| 
 | ||
| static void
 | ||
| w_object(PyObject *v, WFILE *p)
 | ||
| {
 | ||
| 	Py_ssize_t i, n;
 | ||
| 
 | ||
| 	p->depth++;
 | ||
| 
 | ||
| 	if (p->depth > MAX_MARSHAL_STACK_DEPTH) {
 | ||
| 		p->error = WFERR_NESTEDTOODEEP;
 | ||
| 	}
 | ||
| 	else if (v == NULL) {
 | ||
| 		w_byte(TYPE_NULL, p);
 | ||
| 	}
 | ||
| 	else if (v == Py_None) {
 | ||
| 		w_byte(TYPE_NONE, p);
 | ||
| 	}
 | ||
| 	else if (v == PyExc_StopIteration) {
 | ||
| 		w_byte(TYPE_STOPITER, p);
 | ||
| 	}
 | ||
| 	else if (v == Py_Ellipsis) {
 | ||
| 	        w_byte(TYPE_ELLIPSIS, p);
 | ||
| 	}
 | ||
| 	else if (v == Py_False) {
 | ||
| 	        w_byte(TYPE_FALSE, p);
 | ||
| 	}
 | ||
| 	else if (v == Py_True) {
 | ||
| 	        w_byte(TYPE_TRUE, p);
 | ||
| 	}
 | ||
| 	else if (PyLong_CheckExact(v)) {
 | ||
| 		long x = PyLong_AsLong(v);
 | ||
| 		if ((x == -1)  && PyErr_Occurred()) {
 | ||
| 			PyLongObject *ob = (PyLongObject *)v;
 | ||
| 			PyErr_Clear();
 | ||
| 			w_PyLong(ob, p);
 | ||
| 		}
 | ||
| 		else {
 | ||
| #if SIZEOF_LONG > 4
 | ||
| 			long y = Py_ARITHMETIC_RIGHT_SHIFT(long, x, 31);
 | ||
| 			if (y && y != -1) {
 | ||
| 				w_byte(TYPE_INT64, p);
 | ||
| 				w_long64(x, p);
 | ||
| 			}
 | ||
| 			else
 | ||
| #endif
 | ||
| 			{
 | ||
| 				w_byte(TYPE_INT, p);
 | ||
| 				w_long(x, p);
 | ||
| 			}
 | ||
| 		}
 | ||
| 	}
 | ||
| 	else if (PyFloat_CheckExact(v)) {
 | ||
| 		if (p->version > 1) {
 | ||
| 			unsigned char buf[8];
 | ||
| 			if (_PyFloat_Pack8(PyFloat_AsDouble(v), 
 | ||
| 					   buf, 1) < 0) {
 | ||
| 				p->error = WFERR_UNMARSHALLABLE;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			w_byte(TYPE_BINARY_FLOAT, p);
 | ||
| 			w_string((char*)buf, 8, p);
 | ||
| 		}
 | ||
| 		else {
 | ||
| 			char *buf = PyOS_double_to_string(PyFloat_AS_DOUBLE(v),
 | ||
|                                                           'g', 17, 0, NULL);
 | ||
| 			if (!buf) {
 | ||
| 				p->error = WFERR_NOMEMORY;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			n = strlen(buf);
 | ||
| 			w_byte(TYPE_FLOAT, p);
 | ||
| 			w_byte((int)n, p);
 | ||
| 			w_string(buf, (int)n, p);
 | ||
| 			PyMem_Free(buf);
 | ||
| 		}
 | ||
| 	}
 | ||
| #ifndef WITHOUT_COMPLEX
 | ||
| 	else if (PyComplex_CheckExact(v)) {
 | ||
| 		if (p->version > 1) {
 | ||
| 			unsigned char buf[8];
 | ||
| 			if (_PyFloat_Pack8(PyComplex_RealAsDouble(v),
 | ||
| 					   buf, 1) < 0) {
 | ||
| 				p->error = WFERR_UNMARSHALLABLE;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			w_byte(TYPE_BINARY_COMPLEX, p);
 | ||
| 			w_string((char*)buf, 8, p);
 | ||
| 			if (_PyFloat_Pack8(PyComplex_ImagAsDouble(v), 
 | ||
| 					   buf, 1) < 0) {
 | ||
| 				p->error = WFERR_UNMARSHALLABLE;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			w_string((char*)buf, 8, p);
 | ||
| 		}
 | ||
| 		else {
 | ||
| 			char *buf;
 | ||
| 			w_byte(TYPE_COMPLEX, p);
 | ||
| 			buf = PyOS_double_to_string(PyComplex_RealAsDouble(v),
 | ||
|                                                     'g', 17, 0, NULL);
 | ||
| 			if (!buf) {
 | ||
| 				p->error = WFERR_NOMEMORY;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			n = strlen(buf);
 | ||
| 			w_byte((int)n, p);
 | ||
| 			w_string(buf, (int)n, p);
 | ||
| 			PyMem_Free(buf);
 | ||
| 			buf = PyOS_double_to_string(PyComplex_ImagAsDouble(v),
 | ||
|                                                     'g', 17, 0, NULL);
 | ||
| 			if (!buf) {
 | ||
| 				p->error = WFERR_NOMEMORY;
 | ||
| 				return;
 | ||
| 			}
 | ||
| 			n = strlen(buf);
 | ||
| 			w_byte((int)n, p);
 | ||
| 			w_string(buf, (int)n, p);
 | ||
| 			PyMem_Free(buf);
 | ||
| 		}
 | ||
| 	}
 | ||
| #endif
 | ||
| 	else if (PyBytes_CheckExact(v)) {
 | ||
| 		w_byte(TYPE_STRING, p);
 | ||
| 		n = PyBytes_GET_SIZE(v);
 | ||
| 		if (n > INT_MAX) {
 | ||
| 			/* huge strings are not supported */
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		w_long((long)n, p);
 | ||
| 		w_string(PyBytes_AS_STRING(v), (int)n, p);
 | ||
| 	}
 | ||
| 	else if (PyUnicode_CheckExact(v)) {
 | ||
| 	        PyObject *utf8;
 | ||
| 		utf8 = PyUnicode_EncodeUTF8(PyUnicode_AS_UNICODE(v),
 | ||
| 					    PyUnicode_GET_SIZE(v),
 | ||
| 					    "surrogatepass");
 | ||
| 		if (utf8 == NULL) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		w_byte(TYPE_UNICODE, p);
 | ||
| 		n = PyBytes_GET_SIZE(utf8);
 | ||
| 		if (n > INT_MAX) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		w_long((long)n, p);
 | ||
| 		w_string(PyBytes_AS_STRING(utf8), (int)n, p);
 | ||
| 		Py_DECREF(utf8);
 | ||
| 	}
 | ||
| 	else if (PyTuple_CheckExact(v)) {
 | ||
| 		w_byte(TYPE_TUPLE, p);
 | ||
| 		n = PyTuple_Size(v);
 | ||
| 		w_long((long)n, p);
 | ||
| 		for (i = 0; i < n; i++) {
 | ||
| 			w_object(PyTuple_GET_ITEM(v, i), p);
 | ||
| 		}
 | ||
| 	}
 | ||
| 	else if (PyList_CheckExact(v)) {
 | ||
| 		w_byte(TYPE_LIST, p);
 | ||
| 		n = PyList_GET_SIZE(v);
 | ||
| 		w_long((long)n, p);
 | ||
| 		for (i = 0; i < n; i++) {
 | ||
| 			w_object(PyList_GET_ITEM(v, i), p);
 | ||
| 		}
 | ||
| 	}
 | ||
| 	else if (PyDict_CheckExact(v)) {
 | ||
| 		Py_ssize_t pos;
 | ||
| 		PyObject *key, *value;
 | ||
| 		w_byte(TYPE_DICT, p);
 | ||
| 		/* This one is NULL object terminated! */
 | ||
| 		pos = 0;
 | ||
| 		while (PyDict_Next(v, &pos, &key, &value)) {
 | ||
| 			w_object(key, p);
 | ||
| 			w_object(value, p);
 | ||
| 		}
 | ||
| 		w_object((PyObject *)NULL, p);
 | ||
| 	}
 | ||
| 	else if (PyAnySet_CheckExact(v)) {
 | ||
| 		PyObject *value, *it;
 | ||
| 
 | ||
| 		if (PyObject_TypeCheck(v, &PySet_Type))
 | ||
| 			w_byte(TYPE_SET, p);
 | ||
| 		else
 | ||
| 			w_byte(TYPE_FROZENSET, p);
 | ||
| 		n = PyObject_Size(v);
 | ||
| 		if (n == -1) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		w_long((long)n, p);
 | ||
| 		it = PyObject_GetIter(v);
 | ||
| 		if (it == NULL) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		while ((value = PyIter_Next(it)) != NULL) {
 | ||
| 			w_object(value, p);
 | ||
| 			Py_DECREF(value);
 | ||
| 		}
 | ||
| 		Py_DECREF(it);
 | ||
| 		if (PyErr_Occurred()) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 	}
 | ||
| 	else if (PyCode_Check(v)) {
 | ||
| 		PyCodeObject *co = (PyCodeObject *)v;
 | ||
| 		w_byte(TYPE_CODE, p);
 | ||
| 		w_long(co->co_argcount, p);
 | ||
| 		w_long(co->co_kwonlyargcount, p);
 | ||
| 		w_long(co->co_nlocals, p);
 | ||
| 		w_long(co->co_stacksize, p);
 | ||
| 		w_long(co->co_flags, p);
 | ||
| 		w_object(co->co_code, p);
 | ||
| 		w_object(co->co_consts, p);
 | ||
| 		w_object(co->co_names, p);
 | ||
| 		w_object(co->co_varnames, p);
 | ||
| 		w_object(co->co_freevars, p);
 | ||
| 		w_object(co->co_cellvars, p);
 | ||
| 		w_object(co->co_filename, p);
 | ||
| 		w_object(co->co_name, p);
 | ||
| 		w_long(co->co_firstlineno, p);
 | ||
| 		w_object(co->co_lnotab, p);
 | ||
| 	}
 | ||
| 	else if (PyObject_CheckBuffer(v)) {
 | ||
| 		/* Write unknown buffer-style objects as a string */
 | ||
| 		char *s;
 | ||
| 		PyBufferProcs *pb = v->ob_type->tp_as_buffer;
 | ||
|                 Py_buffer view;
 | ||
| 		if ((*pb->bf_getbuffer)(v, &view, PyBUF_SIMPLE) != 0) {
 | ||
|                         w_byte(TYPE_UNKNOWN, p);
 | ||
|                         p->error = WFERR_UNMARSHALLABLE;
 | ||
|                 }
 | ||
| 		w_byte(TYPE_STRING, p);
 | ||
|                 n = view.len;
 | ||
|                 s = view.buf;                        
 | ||
| 		if (n > INT_MAX) {
 | ||
| 			p->depth--;
 | ||
| 			p->error = WFERR_UNMARSHALLABLE;
 | ||
| 			return;
 | ||
| 		}
 | ||
| 		w_long((long)n, p);
 | ||
| 		w_string(s, (int)n, p);
 | ||
|                 if (pb->bf_releasebuffer != NULL)
 | ||
|                         (*pb->bf_releasebuffer)(v, &view);
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		w_byte(TYPE_UNKNOWN, p);
 | ||
| 		p->error = WFERR_UNMARSHALLABLE;
 | ||
| 	}
 | ||
| 	p->depth--;
 | ||
| }
 | ||
| 
 | ||
| /* version currently has no effect for writing longs. */
 | ||
| void
 | ||
| PyMarshal_WriteLongToFile(long x, FILE *fp, int version)
 | ||
| {
 | ||
| 	WFILE wf;
 | ||
| 	wf.fp = fp;
 | ||
| 	wf.error = WFERR_OK;
 | ||
| 	wf.depth = 0;
 | ||
| 	wf.strings = NULL;
 | ||
| 	wf.version = version;
 | ||
| 	w_long(x, &wf);
 | ||
| }
 | ||
| 
 | ||
| void
 | ||
| PyMarshal_WriteObjectToFile(PyObject *x, FILE *fp, int version)
 | ||
| {
 | ||
| 	WFILE wf;
 | ||
| 	wf.fp = fp;
 | ||
| 	wf.error = WFERR_OK;
 | ||
| 	wf.depth = 0;
 | ||
| 	wf.strings = (version > 0) ? PyDict_New() : NULL;
 | ||
| 	wf.version = version;
 | ||
| 	w_object(x, &wf);
 | ||
| 	Py_XDECREF(wf.strings);
 | ||
| }
 | ||
| 
 | ||
| typedef WFILE RFILE; /* Same struct with different invariants */
 | ||
| 
 | ||
| #define rs_byte(p) (((p)->ptr < (p)->end) ? (unsigned char)*(p)->ptr++ : EOF)
 | ||
| 
 | ||
| #define r_byte(p) ((p)->fp ? getc((p)->fp) : rs_byte(p))
 | ||
| 
 | ||
| static int
 | ||
| r_string(char *s, int n, RFILE *p)
 | ||
| {
 | ||
| 	if (p->fp != NULL)
 | ||
| 		/* The result fits into int because it must be <=n. */
 | ||
| 		return (int)fread(s, 1, n, p->fp);
 | ||
| 	if (p->end - p->ptr < n)
 | ||
| 		n = (int)(p->end - p->ptr);
 | ||
| 	memcpy(s, p->ptr, n);
 | ||
| 	p->ptr += n;
 | ||
| 	return n;
 | ||
| }
 | ||
| 
 | ||
| static int
 | ||
| r_short(RFILE *p)
 | ||
| {
 | ||
| 	register short x;
 | ||
| 	x = r_byte(p);
 | ||
| 	x |= r_byte(p) << 8;
 | ||
| 	/* Sign-extension, in case short greater than 16 bits */
 | ||
| 	x |= -(x & 0x8000);
 | ||
| 	return x;
 | ||
| }
 | ||
| 
 | ||
| static long
 | ||
| r_long(RFILE *p)
 | ||
| {
 | ||
| 	register long x;
 | ||
| 	register FILE *fp = p->fp;
 | ||
| 	if (fp) {
 | ||
| 		x = getc(fp);
 | ||
| 		x |= (long)getc(fp) << 8;
 | ||
| 		x |= (long)getc(fp) << 16;
 | ||
| 		x |= (long)getc(fp) << 24;
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		x = rs_byte(p);
 | ||
| 		x |= (long)rs_byte(p) << 8;
 | ||
| 		x |= (long)rs_byte(p) << 16;
 | ||
| 		x |= (long)rs_byte(p) << 24;
 | ||
| 	}
 | ||
| #if SIZEOF_LONG > 4
 | ||
| 	/* Sign extension for 64-bit machines */
 | ||
| 	x |= -(x & 0x80000000L);
 | ||
| #endif
 | ||
| 	return x;
 | ||
| }
 | ||
| 
 | ||
| /* r_long64 deals with the TYPE_INT64 code.  On a machine with
 | ||
|    sizeof(long) > 4, it returns a Python int object, else a Python long
 | ||
|    object.  Note that w_long64 writes out TYPE_INT if 32 bits is enough,
 | ||
|    so there's no inefficiency here in returning a PyLong on 32-bit boxes
 | ||
|    for everything written via TYPE_INT64 (i.e., if an int is written via
 | ||
|    TYPE_INT64, it *needs* more than 32 bits).
 | ||
| */
 | ||
| static PyObject *
 | ||
| r_long64(RFILE *p)
 | ||
| {
 | ||
| 	long lo4 = r_long(p);
 | ||
| 	long hi4 = r_long(p);
 | ||
| #if SIZEOF_LONG > 4
 | ||
| 	long x = (hi4 << 32) | (lo4 & 0xFFFFFFFFL);
 | ||
| 	return PyLong_FromLong(x);
 | ||
| #else
 | ||
| 	unsigned char buf[8];
 | ||
| 	int one = 1;
 | ||
| 	int is_little_endian = (int)*(char*)&one;
 | ||
| 	if (is_little_endian) {
 | ||
| 		memcpy(buf, &lo4, 4);
 | ||
| 		memcpy(buf+4, &hi4, 4);
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		memcpy(buf, &hi4, 4);
 | ||
| 		memcpy(buf+4, &lo4, 4);
 | ||
| 	}
 | ||
| 	return _PyLong_FromByteArray(buf, 8, is_little_endian, 1);
 | ||
| #endif
 | ||
| }
 | ||
| 
 | ||
| static PyObject *
 | ||
| r_PyLong(RFILE *p)
 | ||
| {
 | ||
| 	PyLongObject *ob;
 | ||
| 	int size, i, j, md;
 | ||
| 	long n;
 | ||
| 	digit d;
 | ||
| 
 | ||
| 	n = r_long(p);
 | ||
| 	if (n == 0)
 | ||
| 		return (PyObject *)_PyLong_New(0);
 | ||
| 	if (n < -INT_MAX || n > INT_MAX) {
 | ||
| 		PyErr_SetString(PyExc_ValueError,
 | ||
| 			       "bad marshal data (long size out of range)");
 | ||
| 		return NULL;
 | ||
| 	}
 | ||
| 
 | ||
| 	size = 1 + (ABS(n)-1) / PyLong_MARSHAL_RATIO;
 | ||
| 	ob = _PyLong_New(size);
 | ||
| 	if (ob == NULL)
 | ||
| 		return NULL;
 | ||
| 	Py_SIZE(ob) = n > 0 ? size : -size;
 | ||
| 
 | ||
| 	for (i = 0; i < size-1; i++) {
 | ||
| 		d = 0;
 | ||
| 		for (j=0; j < PyLong_MARSHAL_RATIO; j++) {
 | ||
| 			md = r_short(p);
 | ||
| 			if (md < 0 || md > PyLong_MARSHAL_BASE)
 | ||
| 				goto bad_digit;
 | ||
| 			d += (digit)md << j*PyLong_MARSHAL_SHIFT;
 | ||
| 		}
 | ||
| 		ob->ob_digit[i] = d;
 | ||
| 	}
 | ||
| 	d = 0;
 | ||
| 	for (j=0; j < (ABS(n)-1)%PyLong_MARSHAL_RATIO + 1; j++) {
 | ||
| 		md = r_short(p);
 | ||
| 		if (md < 0 || md > PyLong_MARSHAL_BASE)
 | ||
| 			goto bad_digit;
 | ||
| 		d += (digit)md << j*PyLong_MARSHAL_SHIFT;
 | ||
| 	}
 | ||
| 	ob->ob_digit[size-1] = d;
 | ||
| 	return (PyObject *)ob;
 | ||
|   bad_digit:
 | ||
| 	Py_DECREF(ob);
 | ||
| 	PyErr_SetString(PyExc_ValueError,
 | ||
| 			"bad marshal data (digit out of range in long)");
 | ||
| 	return NULL;
 | ||
| }
 | ||
| 
 | ||
| 
 | ||
| static PyObject *
 | ||
| r_object(RFILE *p)
 | ||
| {
 | ||
| 	/* NULL is a valid return value, it does not necessarily means that
 | ||
| 	   an exception is set. */
 | ||
| 	PyObject *v, *v2;
 | ||
| 	long i, n;
 | ||
| 	int type = r_byte(p);
 | ||
| 	PyObject *retval;
 | ||
| 
 | ||
| 	p->depth++;
 | ||
| 
 | ||
| 	if (p->depth > MAX_MARSHAL_STACK_DEPTH) {
 | ||
| 		p->depth--;
 | ||
| 		PyErr_SetString(PyExc_ValueError, "recursion limit exceeded");
 | ||
| 		return NULL;
 | ||
| 	}
 | ||
| 
 | ||
| 	switch (type) {
 | ||
| 
 | ||
| 	case EOF:
 | ||
| 		PyErr_SetString(PyExc_EOFError,
 | ||
| 				"EOF read where object expected");
 | ||
| 		retval = NULL;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_NULL:
 | ||
| 		retval = NULL;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_NONE:
 | ||
| 		Py_INCREF(Py_None);
 | ||
| 		retval = Py_None;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_STOPITER:
 | ||
| 		Py_INCREF(PyExc_StopIteration);
 | ||
| 		retval = PyExc_StopIteration;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_ELLIPSIS:
 | ||
| 		Py_INCREF(Py_Ellipsis);
 | ||
| 		retval = Py_Ellipsis;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_FALSE:
 | ||
| 		Py_INCREF(Py_False);
 | ||
| 		retval = Py_False;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_TRUE:
 | ||
| 		Py_INCREF(Py_True);
 | ||
| 		retval = Py_True;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_INT:
 | ||
| 		retval = PyLong_FromLong(r_long(p));
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_INT64:
 | ||
| 		retval = r_long64(p);
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_LONG:
 | ||
| 		retval = r_PyLong(p);
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_FLOAT:
 | ||
| 		{
 | ||
| 			char buf[256];
 | ||
| 			double dx;
 | ||
| 			retval = NULL;
 | ||
| 			n = r_byte(p);
 | ||
| 			if (n == EOF || r_string(buf, (int)n, p) != n) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			buf[n] = '\0';
 | ||
| 			dx = PyOS_string_to_double(buf, NULL, NULL);
 | ||
| 			if (dx == -1.0 && PyErr_Occurred())
 | ||
| 				break;
 | ||
| 			retval = PyFloat_FromDouble(dx);
 | ||
| 			break;
 | ||
| 		}
 | ||
| 
 | ||
| 	case TYPE_BINARY_FLOAT:
 | ||
| 		{
 | ||
| 			unsigned char buf[8];
 | ||
| 			double x;
 | ||
| 			if (r_string((char*)buf, 8, p) != 8) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			x = _PyFloat_Unpack8(buf, 1);
 | ||
| 			if (x == -1.0 && PyErr_Occurred()) {
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			retval = PyFloat_FromDouble(x);
 | ||
| 			break;
 | ||
| 		}
 | ||
| 
 | ||
| #ifndef WITHOUT_COMPLEX
 | ||
| 	case TYPE_COMPLEX:
 | ||
| 		{
 | ||
| 			char buf[256];
 | ||
| 			Py_complex c;
 | ||
| 			retval = NULL;
 | ||
| 			n = r_byte(p);
 | ||
| 			if (n == EOF || r_string(buf, (int)n, p) != n) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			buf[n] = '\0';
 | ||
| 			c.real = PyOS_string_to_double(buf, NULL, NULL);
 | ||
| 			if (c.real == -1.0 && PyErr_Occurred())
 | ||
| 				break;
 | ||
| 			n = r_byte(p);
 | ||
| 			if (n == EOF || r_string(buf, (int)n, p) != n) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			buf[n] = '\0';
 | ||
| 			c.imag = PyOS_string_to_double(buf, NULL, NULL);
 | ||
| 			if (c.imag == -1.0 && PyErr_Occurred())
 | ||
| 				break;
 | ||
| 			retval = PyComplex_FromCComplex(c);
 | ||
| 			break;
 | ||
| 		}
 | ||
| 
 | ||
| 	case TYPE_BINARY_COMPLEX:
 | ||
| 		{
 | ||
| 			unsigned char buf[8];
 | ||
| 			Py_complex c;
 | ||
| 			if (r_string((char*)buf, 8, p) != 8) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			c.real = _PyFloat_Unpack8(buf, 1);
 | ||
| 			if (c.real == -1.0 && PyErr_Occurred()) {
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			if (r_string((char*)buf, 8, p) != 8) {
 | ||
| 				PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			c.imag = _PyFloat_Unpack8(buf, 1);
 | ||
| 			if (c.imag == -1.0 && PyErr_Occurred()) {
 | ||
| 				retval = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			retval = PyComplex_FromCComplex(c);
 | ||
| 			break;
 | ||
| 		}
 | ||
| #endif
 | ||
| 
 | ||
| 	case TYPE_STRING:
 | ||
| 		n = r_long(p);
 | ||
| 		if (n < 0 || n > INT_MAX) {
 | ||
| 			PyErr_SetString(PyExc_ValueError, "bad marshal data (string size out of range)");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		v = PyBytes_FromStringAndSize((char *)NULL, n);
 | ||
| 		if (v == NULL) {
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		if (r_string(PyBytes_AS_STRING(v), (int)n, p) != n) {
 | ||
| 			Py_DECREF(v);
 | ||
| 			PyErr_SetString(PyExc_EOFError,
 | ||
| 					"EOF read where object expected");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_UNICODE:
 | ||
| 	    {
 | ||
| 		char *buffer;
 | ||
| 
 | ||
| 		n = r_long(p);
 | ||
| 		if (n < 0 || n > INT_MAX) {
 | ||
| 			PyErr_SetString(PyExc_ValueError, "bad marshal data (unicode size out of range)");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		buffer = PyMem_NEW(char, n);
 | ||
| 		if (buffer == NULL) {
 | ||
| 			retval = PyErr_NoMemory();
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		if (r_string(buffer, (int)n, p) != n) {
 | ||
| 			PyMem_DEL(buffer);
 | ||
| 			PyErr_SetString(PyExc_EOFError,
 | ||
| 				"EOF read where object expected");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		v = PyUnicode_DecodeUTF8(buffer, n, "surrogatepass");
 | ||
| 		PyMem_DEL(buffer);
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 	    }
 | ||
| 
 | ||
| 	case TYPE_TUPLE:
 | ||
| 		n = r_long(p);
 | ||
| 		if (n < 0 || n > INT_MAX) {
 | ||
| 			PyErr_SetString(PyExc_ValueError, "bad marshal data (tuple size out of range)");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		v = PyTuple_New((int)n);
 | ||
| 		if (v == NULL) {
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		for (i = 0; i < n; i++) {
 | ||
| 			v2 = r_object(p);
 | ||
| 			if ( v2 == NULL ) {
 | ||
| 				if (!PyErr_Occurred())
 | ||
| 					PyErr_SetString(PyExc_TypeError,
 | ||
| 						"NULL object in marshal data for tuple");
 | ||
| 				Py_DECREF(v);
 | ||
| 				v = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			PyTuple_SET_ITEM(v, (int)i, v2);
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_LIST:
 | ||
| 		n = r_long(p);
 | ||
| 		if (n < 0 || n > INT_MAX) {
 | ||
| 			PyErr_SetString(PyExc_ValueError, "bad marshal data (list size out of range)");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		v = PyList_New((int)n);
 | ||
| 		if (v == NULL) {
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		for (i = 0; i < n; i++) {
 | ||
| 			v2 = r_object(p);
 | ||
| 			if ( v2 == NULL ) {
 | ||
| 				if (!PyErr_Occurred())
 | ||
| 					PyErr_SetString(PyExc_TypeError,
 | ||
| 						"NULL object in marshal data for list");
 | ||
| 				Py_DECREF(v);
 | ||
| 				v = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			PyList_SET_ITEM(v, (int)i, v2);
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_DICT:
 | ||
| 		v = PyDict_New();
 | ||
| 		if (v == NULL) {
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		for (;;) {
 | ||
| 			PyObject *key, *val;
 | ||
| 			key = r_object(p);
 | ||
| 			if (key == NULL)
 | ||
| 				break;
 | ||
| 			val = r_object(p);
 | ||
| 			if (val != NULL)
 | ||
| 				PyDict_SetItem(v, key, val);
 | ||
| 			Py_DECREF(key);
 | ||
| 			Py_XDECREF(val);
 | ||
| 		}
 | ||
| 		if (PyErr_Occurred()) {
 | ||
| 			Py_DECREF(v);
 | ||
| 			v = NULL;
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_SET:
 | ||
| 	case TYPE_FROZENSET:
 | ||
| 		n = r_long(p);
 | ||
| 		if (n < 0 || n > INT_MAX) {
 | ||
| 			PyErr_SetString(PyExc_ValueError, "bad marshal data (set size out of range)");
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
|                 v = (type == TYPE_SET) ? PySet_New(NULL) : PyFrozenSet_New(NULL);
 | ||
| 		if (v == NULL) {
 | ||
| 			retval = NULL;
 | ||
| 			break;
 | ||
| 		}
 | ||
| 		for (i = 0; i < n; i++) {
 | ||
| 			v2 = r_object(p);
 | ||
| 			if ( v2 == NULL ) {
 | ||
| 				if (!PyErr_Occurred())
 | ||
| 					PyErr_SetString(PyExc_TypeError,
 | ||
| 						"NULL object in marshal data for set");
 | ||
| 				Py_DECREF(v);
 | ||
| 				v = NULL;
 | ||
| 				break;
 | ||
| 			}
 | ||
| 			if (PySet_Add(v, v2) == -1) {
 | ||
|                                 Py_DECREF(v);
 | ||
|                                 Py_DECREF(v2);
 | ||
|                                 v = NULL;
 | ||
|                                 break;
 | ||
|                         }
 | ||
|                         Py_DECREF(v2);
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	case TYPE_CODE:
 | ||
| 		{
 | ||
| 			int argcount;
 | ||
| 			int kwonlyargcount;
 | ||
| 			int nlocals;
 | ||
| 			int stacksize;
 | ||
| 			int flags;
 | ||
| 			PyObject *code = NULL;
 | ||
| 			PyObject *consts = NULL;
 | ||
| 			PyObject *names = NULL;
 | ||
| 			PyObject *varnames = NULL;
 | ||
| 			PyObject *freevars = NULL;
 | ||
| 			PyObject *cellvars = NULL;
 | ||
| 			PyObject *filename = NULL;
 | ||
| 			PyObject *name = NULL;
 | ||
| 			int firstlineno;
 | ||
| 			PyObject *lnotab = NULL;
 | ||
| 			
 | ||
| 			v = NULL;
 | ||
| 
 | ||
| 			/* XXX ignore long->int overflows for now */
 | ||
| 			argcount = (int)r_long(p);
 | ||
| 			kwonlyargcount = (int)r_long(p);
 | ||
| 			nlocals = (int)r_long(p);
 | ||
| 			stacksize = (int)r_long(p);
 | ||
| 			flags = (int)r_long(p);
 | ||
| 			code = r_object(p);
 | ||
| 			if (code == NULL)
 | ||
| 				goto code_error;
 | ||
| 			consts = r_object(p);
 | ||
| 			if (consts == NULL)
 | ||
| 				goto code_error;
 | ||
| 			names = r_object(p);
 | ||
| 			if (names == NULL)
 | ||
| 				goto code_error;
 | ||
| 			varnames = r_object(p);
 | ||
| 			if (varnames == NULL)
 | ||
| 				goto code_error;
 | ||
| 			freevars = r_object(p);
 | ||
| 			if (freevars == NULL)
 | ||
| 				goto code_error;
 | ||
| 			cellvars = r_object(p);
 | ||
| 			if (cellvars == NULL)
 | ||
| 				goto code_error;
 | ||
| 			filename = r_object(p);
 | ||
| 			if (filename == NULL)
 | ||
| 				goto code_error;
 | ||
| 			name = r_object(p);
 | ||
| 			if (name == NULL)
 | ||
| 				goto code_error;
 | ||
| 			firstlineno = (int)r_long(p);
 | ||
| 			lnotab = r_object(p);
 | ||
| 			if (lnotab == NULL)
 | ||
| 				goto code_error;
 | ||
| 
 | ||
| 			v = (PyObject *) PyCode_New(
 | ||
| 					argcount, kwonlyargcount,
 | ||
| 					nlocals, stacksize, flags,
 | ||
| 					code, consts, names, varnames,
 | ||
| 					freevars, cellvars, filename, name,
 | ||
| 					firstlineno, lnotab);
 | ||
| 
 | ||
| 		  code_error:
 | ||
| 			Py_XDECREF(code);
 | ||
| 			Py_XDECREF(consts);
 | ||
| 			Py_XDECREF(names);
 | ||
| 			Py_XDECREF(varnames);
 | ||
| 			Py_XDECREF(freevars);
 | ||
| 			Py_XDECREF(cellvars);
 | ||
| 			Py_XDECREF(filename);
 | ||
| 			Py_XDECREF(name);
 | ||
| 			Py_XDECREF(lnotab);
 | ||
| 		}
 | ||
| 		retval = v;
 | ||
| 		break;
 | ||
| 
 | ||
| 	default:
 | ||
| 		/* Bogus data got written, which isn't ideal.
 | ||
| 		   This will let you keep working and recover. */
 | ||
| 		PyErr_SetString(PyExc_ValueError, "bad marshal data (unknown type code)");
 | ||
| 		retval = NULL;
 | ||
| 		break;
 | ||
| 
 | ||
| 	}
 | ||
| 	p->depth--;
 | ||
| 	return retval;
 | ||
| }
 | ||
| 
 | ||
| static PyObject *
 | ||
| read_object(RFILE *p)
 | ||
| {
 | ||
| 	PyObject *v;
 | ||
| 	if (PyErr_Occurred()) {
 | ||
| 		fprintf(stderr, "XXX readobject called with exception set\n");
 | ||
| 		return NULL;
 | ||
| 	}
 | ||
| 	v = r_object(p);
 | ||
| 	if (v == NULL && !PyErr_Occurred())
 | ||
| 		PyErr_SetString(PyExc_TypeError, "NULL object in marshal data for object");
 | ||
| 	return v;
 | ||
| }
 | ||
| 
 | ||
| int
 | ||
| PyMarshal_ReadShortFromFile(FILE *fp)
 | ||
| {
 | ||
| 	RFILE rf;
 | ||
| 	assert(fp);
 | ||
| 	rf.fp = fp;
 | ||
| 	rf.strings = NULL;
 | ||
| 	rf.end = rf.ptr = NULL;
 | ||
| 	return r_short(&rf);
 | ||
| }
 | ||
| 
 | ||
| long
 | ||
| PyMarshal_ReadLongFromFile(FILE *fp)
 | ||
| {
 | ||
| 	RFILE rf;
 | ||
| 	rf.fp = fp;
 | ||
| 	rf.strings = NULL;
 | ||
| 	rf.ptr = rf.end = NULL;
 | ||
| 	return r_long(&rf);
 | ||
| }
 | ||
| 
 | ||
| #ifdef HAVE_FSTAT
 | ||
| /* Return size of file in bytes; < 0 if unknown. */
 | ||
| static off_t
 | ||
| getfilesize(FILE *fp)
 | ||
| {
 | ||
| 	struct stat st;
 | ||
| 	if (fstat(fileno(fp), &st) != 0)
 | ||
| 		return -1;
 | ||
| 	else
 | ||
| 		return st.st_size;
 | ||
| }
 | ||
| #endif
 | ||
| 
 | ||
| /* If we can get the size of the file up-front, and it's reasonably small,
 | ||
|  * read it in one gulp and delegate to ...FromString() instead.  Much quicker
 | ||
|  * than reading a byte at a time from file; speeds .pyc imports.
 | ||
|  * CAUTION:  since this may read the entire remainder of the file, don't
 | ||
|  * call it unless you know you're done with the file.
 | ||
|  */
 | ||
| PyObject *
 | ||
| PyMarshal_ReadLastObjectFromFile(FILE *fp)
 | ||
| {
 | ||
| /* 75% of 2.1's .pyc files can exploit SMALL_FILE_LIMIT.
 | ||
|  * REASONABLE_FILE_LIMIT is by defn something big enough for Tkinter.pyc.
 | ||
|  */
 | ||
| #define SMALL_FILE_LIMIT (1L << 14)
 | ||
| #define REASONABLE_FILE_LIMIT (1L << 18)
 | ||
| #ifdef HAVE_FSTAT
 | ||
| 	off_t filesize;
 | ||
| #endif
 | ||
| #ifdef HAVE_FSTAT
 | ||
| 	filesize = getfilesize(fp);
 | ||
| 	if (filesize > 0) {
 | ||
| 		char buf[SMALL_FILE_LIMIT];
 | ||
| 		char* pBuf = NULL;
 | ||
| 		if (filesize <= SMALL_FILE_LIMIT)
 | ||
| 			pBuf = buf;
 | ||
| 		else if (filesize <= REASONABLE_FILE_LIMIT)
 | ||
| 			pBuf = (char *)PyMem_MALLOC(filesize);
 | ||
| 		if (pBuf != NULL) {
 | ||
| 			PyObject* v;
 | ||
| 			size_t n;
 | ||
| 			/* filesize must fit into an int, because it
 | ||
| 			   is smaller than REASONABLE_FILE_LIMIT */
 | ||
| 			n = fread(pBuf, 1, (int)filesize, fp);
 | ||
| 			v = PyMarshal_ReadObjectFromString(pBuf, n);
 | ||
| 			if (pBuf != buf)
 | ||
| 				PyMem_FREE(pBuf);
 | ||
| 			return v;
 | ||
| 		}
 | ||
| 
 | ||
| 	}
 | ||
| #endif
 | ||
| 	/* We don't have fstat, or we do but the file is larger than
 | ||
| 	 * REASONABLE_FILE_LIMIT or malloc failed -- read a byte at a time.
 | ||
| 	 */
 | ||
| 	return PyMarshal_ReadObjectFromFile(fp);
 | ||
| 
 | ||
| #undef SMALL_FILE_LIMIT
 | ||
| #undef REASONABLE_FILE_LIMIT
 | ||
| }
 | ||
| 
 | ||
| PyObject *
 | ||
| PyMarshal_ReadObjectFromFile(FILE *fp)
 | ||
| {
 | ||
| 	RFILE rf;
 | ||
| 	PyObject *result;
 | ||
| 	rf.fp = fp;
 | ||
| 	rf.strings = PyList_New(0);
 | ||
| 	rf.depth = 0;
 | ||
| 	rf.ptr = rf.end = NULL;
 | ||
| 	result = r_object(&rf);
 | ||
| 	Py_DECREF(rf.strings);
 | ||
| 	return result;
 | ||
| }
 | ||
| 
 | ||
| PyObject *
 | ||
| PyMarshal_ReadObjectFromString(char *str, Py_ssize_t len)
 | ||
| {
 | ||
| 	RFILE rf;
 | ||
| 	PyObject *result;
 | ||
| 	rf.fp = NULL;
 | ||
| 	rf.ptr = str;
 | ||
| 	rf.end = str + len;
 | ||
| 	rf.strings = PyList_New(0);
 | ||
| 	rf.depth = 0;
 | ||
| 	result = r_object(&rf);
 | ||
| 	Py_DECREF(rf.strings);
 | ||
| 	return result;
 | ||
| }
 | ||
| 
 | ||
| PyObject *
 | ||
| PyMarshal_WriteObjectToString(PyObject *x, int version)
 | ||
| {
 | ||
| 	WFILE wf;
 | ||
| 	PyObject *res = NULL;
 | ||
| 
 | ||
| 	wf.fp = NULL;
 | ||
| 	wf.str = PyBytes_FromStringAndSize((char *)NULL, 50);
 | ||
| 	if (wf.str == NULL)
 | ||
| 		return NULL;
 | ||
| 	wf.ptr = PyBytes_AS_STRING((PyBytesObject *)wf.str);
 | ||
| 	wf.end = wf.ptr + PyBytes_Size(wf.str);
 | ||
| 	wf.error = WFERR_OK;
 | ||
| 	wf.depth = 0;
 | ||
| 	wf.version = version;
 | ||
| 	wf.strings = (version > 0) ? PyDict_New() : NULL;
 | ||
| 	w_object(x, &wf);
 | ||
| 	Py_XDECREF(wf.strings);
 | ||
| 	if (wf.str != NULL) {
 | ||
| 		char *base = PyBytes_AS_STRING((PyBytesObject *)wf.str);
 | ||
| 		if (wf.ptr - base > PY_SSIZE_T_MAX) {
 | ||
| 			Py_DECREF(wf.str);
 | ||
| 			PyErr_SetString(PyExc_OverflowError,
 | ||
| 					"too much marshal data for a string");
 | ||
| 			return NULL;
 | ||
| 		}
 | ||
| 		if (_PyBytes_Resize(&wf.str, (Py_ssize_t)(wf.ptr - base)) < 0)
 | ||
| 			return NULL;
 | ||
| 	}
 | ||
| 	if (wf.error != WFERR_OK) {
 | ||
| 		Py_XDECREF(wf.str);
 | ||
|                 if (wf.error == WFERR_NOMEMORY)
 | ||
|                     PyErr_NoMemory();
 | ||
|                 else
 | ||
|                     PyErr_SetString(PyExc_ValueError,
 | ||
|                       (wf.error==WFERR_UNMARSHALLABLE)?"unmarshallable object"
 | ||
|                        :"object too deeply nested to marshal");
 | ||
| 		return NULL;
 | ||
| 	}
 | ||
| 	if (wf.str != NULL) {
 | ||
| 		/* XXX Quick hack -- need to do this differently */
 | ||
| 		res = PyBytes_FromObject(wf.str);
 | ||
| 		Py_DECREF(wf.str);
 | ||
| 	}
 | ||
| 	return res;
 | ||
| }
 | ||
| 
 | ||
| /* And an interface for Python programs... */
 | ||
| 
 | ||
| static PyObject *
 | ||
| marshal_dump(PyObject *self, PyObject *args)
 | ||
| {
 | ||
| 	/* XXX Quick hack -- need to do this differently */
 | ||
| 	PyObject *x;
 | ||
| 	PyObject *f;
 | ||
| 	int version = Py_MARSHAL_VERSION;
 | ||
| 	PyObject *s;
 | ||
| 	PyObject *res;
 | ||
| 	if (!PyArg_ParseTuple(args, "OO|i:dump", &x, &f, &version))
 | ||
| 		return NULL;
 | ||
| 	s = PyMarshal_WriteObjectToString(x, version);
 | ||
| 	if (s == NULL)
 | ||
| 		return NULL;
 | ||
| 	res = PyObject_CallMethod(f, "write", "O", s);
 | ||
| 	Py_DECREF(s);
 | ||
| 	return res;
 | ||
| }
 | ||
| 
 | ||
| PyDoc_STRVAR(dump_doc,
 | ||
| "dump(value, file[, version])\n\
 | ||
| \n\
 | ||
| Write the value on the open file. The value must be a supported type.\n\
 | ||
| The file must be an open file object such as sys.stdout or returned by\n\
 | ||
| open() or os.popen(). It must be opened in binary mode ('wb' or 'w+b').\n\
 | ||
| \n\
 | ||
| If the value has (or contains an object that has) an unsupported type, a\n\
 | ||
| ValueError exception is raised — but garbage data will also be written\n\
 | ||
| to the file. The object will not be properly read back by load()\n\
 | ||
| \n\
 | ||
| The version argument indicates the data format that dump should use.");
 | ||
| 
 | ||
| static PyObject *
 | ||
| marshal_load(PyObject *self, PyObject *f)
 | ||
| {
 | ||
| 	/* XXX Quick hack -- need to do this differently */
 | ||
| 	PyObject *data, *result;
 | ||
| 	RFILE rf;
 | ||
| 	data = PyObject_CallMethod(f, "read", "");
 | ||
| 	if (data == NULL)
 | ||
| 		return NULL;
 | ||
| 	rf.fp = NULL;
 | ||
| 	if (PyBytes_Check(data)) {
 | ||
| 		rf.ptr = PyBytes_AS_STRING(data);
 | ||
| 		rf.end = rf.ptr + PyBytes_GET_SIZE(data);
 | ||
| 	}
 | ||
| 	else if (PyBytes_Check(data)) {
 | ||
| 		rf.ptr = PyBytes_AS_STRING(data);
 | ||
| 		rf.end = rf.ptr + PyBytes_GET_SIZE(data);
 | ||
| 	}
 | ||
| 	else {
 | ||
| 		PyErr_Format(PyExc_TypeError,
 | ||
| 			     "f.read() returned neither string "
 | ||
| 			     "nor bytes but %.100s",
 | ||
| 			     data->ob_type->tp_name);
 | ||
| 		Py_DECREF(data);
 | ||
| 		return NULL;
 | ||
| 	}
 | ||
| 	rf.strings = PyList_New(0);
 | ||
| 	rf.depth = 0;
 | ||
| 	result = read_object(&rf);
 | ||
| 	Py_DECREF(rf.strings);
 | ||
| 	Py_DECREF(data);
 | ||
| 	return result;
 | ||
| }
 | ||
| 
 | ||
| PyDoc_STRVAR(load_doc,
 | ||
| "load(file)\n\
 | ||
| \n\
 | ||
| Read one value from the open file and return it. If no valid value is\n\
 | ||
| read (e.g. because the data has a different Python version’s\n\
 | ||
| incompatible marshal format), raise EOFError, ValueError or TypeError.\n\
 | ||
| The file must be an open file object opened in binary mode ('rb' or\n\
 | ||
| 'r+b').\n\
 | ||
| \n\
 | ||
| Note: If an object containing an unsupported type was marshalled with\n\
 | ||
| dump(), load() will substitute None for the unmarshallable type.");
 | ||
| 
 | ||
| 
 | ||
| static PyObject *
 | ||
| marshal_dumps(PyObject *self, PyObject *args)
 | ||
| {
 | ||
| 	PyObject *x;
 | ||
| 	int version = Py_MARSHAL_VERSION;
 | ||
| 	if (!PyArg_ParseTuple(args, "O|i:dumps", &x, &version))
 | ||
| 		return NULL;
 | ||
| 	return PyMarshal_WriteObjectToString(x, version);
 | ||
| }
 | ||
| 
 | ||
| PyDoc_STRVAR(dumps_doc,
 | ||
| "dumps(value[, version])\n\
 | ||
| \n\
 | ||
| Return the string that would be written to a file by dump(value, file).\n\
 | ||
| The value must be a supported type. Raise a ValueError exception if\n\
 | ||
| value has (or contains an object that has) an unsupported type.\n\
 | ||
| \n\
 | ||
| The version argument indicates the data format that dumps should use.");
 | ||
| 
 | ||
| 
 | ||
| static PyObject *
 | ||
| marshal_loads(PyObject *self, PyObject *args)
 | ||
| {
 | ||
| 	RFILE rf;
 | ||
| 	Py_buffer p;
 | ||
| 	char *s;
 | ||
| 	Py_ssize_t n;
 | ||
| 	PyObject* result;
 | ||
| 	if (!PyArg_ParseTuple(args, "s*:loads", &p))
 | ||
| 		return NULL;
 | ||
| 	s = p.buf;
 | ||
| 	n = p.len;
 | ||
| 	rf.fp = NULL;
 | ||
| 	rf.ptr = s;
 | ||
| 	rf.end = s + n;
 | ||
| 	rf.strings = PyList_New(0);
 | ||
| 	rf.depth = 0;
 | ||
| 	result = read_object(&rf);
 | ||
| 	Py_DECREF(rf.strings);
 | ||
| 	PyBuffer_Release(&p);
 | ||
| 	return result;
 | ||
| }
 | ||
| 
 | ||
| PyDoc_STRVAR(loads_doc,
 | ||
| "loads(string)\n\
 | ||
| \n\
 | ||
| Convert the string to a value. If no valid value is found, raise\n\
 | ||
| EOFError, ValueError or TypeError. Extra characters in the string are\n\
 | ||
| ignored.");
 | ||
| 
 | ||
| static PyMethodDef marshal_methods[] = {
 | ||
| 	{"dump",	marshal_dump,	METH_VARARGS,	dump_doc},
 | ||
| 	{"load",	marshal_load,	METH_O,		load_doc},
 | ||
| 	{"dumps",	marshal_dumps,	METH_VARARGS,	dumps_doc},
 | ||
| 	{"loads",	marshal_loads,	METH_VARARGS,	loads_doc},
 | ||
| 	{NULL,		NULL}		/* sentinel */
 | ||
| };
 | ||
| 
 | ||
| 
 | ||
| PyDoc_STRVAR(module_doc,
 | ||
| "This module contains functions that can read and write Python values in\n\
 | ||
| a binary format. The format is specific to Python, but independent of\n\
 | ||
| machine architecture issues.\n\
 | ||
| \n\
 | ||
| Not all Python object types are supported; in general, only objects\n\
 | ||
| whose value is independent from a particular invocation of Python can be\n\
 | ||
| written and read by this module. The following types are supported:\n\
 | ||
| None, integers, floating point numbers, strings, bytes, bytearrays,\n\
 | ||
| tuples, lists, sets, dictionaries, and code objects, where it\n\
 | ||
| should be understood that tuples, lists and dictionaries are only\n\
 | ||
| supported as long as the values contained therein are themselves\n\
 | ||
| supported; and recursive lists and dictionaries should not be written\n\
 | ||
| (they will cause infinite loops).\n\
 | ||
| \n\
 | ||
| Variables:\n\
 | ||
| \n\
 | ||
| version -- indicates the format that the module uses. Version 0 is the\n\
 | ||
|     historical format, version 1 shares interned strings and version 2\n\
 | ||
|     uses a binary format for floating point numbers.\n\
 | ||
| \n\
 | ||
| Functions:\n\
 | ||
| \n\
 | ||
| dump() -- write value to a file\n\
 | ||
| load() -- read value from a file\n\
 | ||
| dumps() -- write value to a string\n\
 | ||
| loads() -- read value from a string");
 | ||
| 
 | ||
| 
 | ||
| 
 | ||
| static struct PyModuleDef marshalmodule = {
 | ||
| 	PyModuleDef_HEAD_INIT,
 | ||
| 	"marshal",
 | ||
| 	module_doc,
 | ||
| 	0,
 | ||
| 	marshal_methods,
 | ||
| 	NULL,
 | ||
| 	NULL,
 | ||
| 	NULL,
 | ||
| 	NULL
 | ||
| };
 | ||
| 
 | ||
| PyMODINIT_FUNC
 | ||
| PyMarshal_Init(void)
 | ||
| {
 | ||
| 	PyObject *mod = PyModule_Create(&marshalmodule);
 | ||
| 	if (mod == NULL)
 | ||
| 		return NULL;
 | ||
| 	PyModule_AddIntConstant(mod, "version", Py_MARSHAL_VERSION);
 | ||
| 	return mod;
 | ||
| }
 |