move sections
[python/dscho.git] / Modules / cPickle.c
blobbd577ad3da113c17234a31f9c212b6c65207f18c
1 #include "Python.h"
2 #include "cStringIO.h"
3 #include "structmember.h"
5 PyDoc_STRVAR(cPickle_module_documentation,
6 "C implementation and optimization of the Python pickle module.");
8 #ifndef Py_eval_input
9 #include <graminit.h>
10 #define Py_eval_input eval_input
11 #endif /* Py_eval_input */
13 #define DEL_LIST_SLICE(list, from, to) (PyList_SetSlice(list, from, to, NULL))
15 #define WRITE_BUF_SIZE 256
17 /* Bump this when new opcodes are added to the pickle protocol. */
18 #define HIGHEST_PROTOCOL 2
21 * Note: The UNICODE macro controls the TCHAR meaning of the win32 API. Since
22 * all headers have already been included here, we can safely redefine it.
24 #ifdef UNICODE
25 # undef UNICODE
26 #endif
29 * Pickle opcodes. These must be kept in synch with pickle.py. Extensive
30 * docs are in pickletools.py.
32 #define MARK '('
33 #define STOP '.'
34 #define POP '0'
35 #define POP_MARK '1'
36 #define DUP '2'
37 #define FLOAT 'F'
38 #define BINFLOAT 'G'
39 #define INT 'I'
40 #define BININT 'J'
41 #define BININT1 'K'
42 #define LONG 'L'
43 #define BININT2 'M'
44 #define NONE 'N'
45 #define PERSID 'P'
46 #define BINPERSID 'Q'
47 #define REDUCE 'R'
48 #define STRING 'S'
49 #define BINSTRING 'T'
50 #define SHORT_BINSTRING 'U'
51 #define UNICODE 'V'
52 #define BINUNICODE 'X'
53 #define APPEND 'a'
54 #define BUILD 'b'
55 #define GLOBAL 'c'
56 #define DICT 'd'
57 #define EMPTY_DICT '}'
58 #define APPENDS 'e'
59 #define GET 'g'
60 #define BINGET 'h'
61 #define INST 'i'
62 #define LONG_BINGET 'j'
63 #define LIST 'l'
64 #define EMPTY_LIST ']'
65 #define OBJ 'o'
66 #define PUT 'p'
67 #define BINPUT 'q'
68 #define LONG_BINPUT 'r'
69 #define SETITEM 's'
70 #define TUPLE 't'
71 #define EMPTY_TUPLE ')'
72 #define SETITEMS 'u'
74 /* Protocol 2. */
75 #define PROTO '\x80' /* identify pickle protocol */
76 #define NEWOBJ '\x81' /* build object by applying cls.__new__ to argtuple */
77 #define EXT1 '\x82' /* push object from extension registry; 1-byte index */
78 #define EXT2 '\x83' /* ditto, but 2-byte index */
79 #define EXT4 '\x84' /* ditto, but 4-byte index */
80 #define TUPLE1 '\x85' /* build 1-tuple from stack top */
81 #define TUPLE2 '\x86' /* build 2-tuple from two topmost stack items */
82 #define TUPLE3 '\x87' /* build 3-tuple from three topmost stack items */
83 #define NEWTRUE '\x88' /* push True */
84 #define NEWFALSE '\x89' /* push False */
85 #define LONG1 '\x8a' /* push long from < 256 bytes */
86 #define LONG4 '\x8b' /* push really big long */
88 /* There aren't opcodes -- they're ways to pickle bools before protocol 2,
89 * so that unpicklers written before bools were introduced unpickle them
90 * as ints, but unpicklers after can recognize that bools were intended.
91 * Note that protocol 2 added direct ways to pickle bools.
93 #undef TRUE
94 #define TRUE "I01\n"
95 #undef FALSE
96 #define FALSE "I00\n"
98 /* Keep in synch with pickle.Pickler._BATCHSIZE. This is how many elements
99 * batch_list/dict() pumps out before doing APPENDS/SETITEMS. Nothing will
100 * break if this gets out of synch with pickle.py, but it's unclear that
101 * would help anything either.
103 #define BATCHSIZE 1000
105 static char MARKv = MARK;
107 static PyObject *PickleError;
108 static PyObject *PicklingError;
109 static PyObject *UnpickleableError;
110 static PyObject *UnpicklingError;
111 static PyObject *BadPickleGet;
113 /* As the name says, an empty tuple. */
114 static PyObject *empty_tuple;
116 /* copy_reg.dispatch_table, {type_object: pickling_function} */
117 static PyObject *dispatch_table;
119 /* For EXT[124] opcodes. */
120 /* copy_reg._extension_registry, {(module_name, function_name): code} */
121 static PyObject *extension_registry;
122 /* copy_reg._inverted_registry, {code: (module_name, function_name)} */
123 static PyObject *inverted_registry;
124 /* copy_reg._extension_cache, {code: object} */
125 static PyObject *extension_cache;
127 /* For looking up name pairs in copy_reg._extension_registry. */
128 static PyObject *two_tuple;
130 static PyObject *__class___str, *__getinitargs___str, *__dict___str,
131 *__getstate___str, *__setstate___str, *__name___str, *__reduce___str,
132 *__reduce_ex___str,
133 *write_str, *append_str,
134 *read_str, *readline_str, *__main___str,
135 *dispatch_table_str;
137 /*************************************************************************
138 Internal Data type for pickle data. */
140 typedef struct {
141 PyObject_HEAD
142 int length; /* number of initial slots in data currently used */
143 int size; /* number of slots in data allocated */
144 PyObject **data;
145 } Pdata;
147 static void
148 Pdata_dealloc(Pdata *self)
150 int i;
151 PyObject **p;
153 for (i = self->length, p = self->data; --i >= 0; p++) {
154 Py_DECREF(*p);
156 if (self->data)
157 free(self->data);
158 PyObject_Del(self);
161 static PyTypeObject PdataType = {
162 PyVarObject_HEAD_INIT(NULL, 0) "cPickle.Pdata", sizeof(Pdata), 0,
163 (destructor)Pdata_dealloc,
164 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0L,0L,0L,0L, ""
167 #define Pdata_Check(O) (Py_TYPE(O) == &PdataType)
169 static PyObject *
170 Pdata_New(void)
172 Pdata *self;
174 if (!(self = PyObject_New(Pdata, &PdataType)))
175 return NULL;
176 self->size = 8;
177 self->length = 0;
178 self->data = malloc(self->size * sizeof(PyObject*));
179 if (self->data)
180 return (PyObject*)self;
181 Py_DECREF(self);
182 return PyErr_NoMemory();
185 static int
186 stackUnderflow(void)
188 PyErr_SetString(UnpicklingError, "unpickling stack underflow");
189 return -1;
192 /* Retain only the initial clearto items. If clearto >= the current
193 * number of items, this is a (non-erroneous) NOP.
195 static int
196 Pdata_clear(Pdata *self, int clearto)
198 int i;
199 PyObject **p;
201 if (clearto < 0) return stackUnderflow();
202 if (clearto >= self->length) return 0;
204 for (i = self->length, p = self->data + clearto;
205 --i >= clearto;
206 p++) {
207 Py_CLEAR(*p);
209 self->length = clearto;
211 return 0;
214 static int
215 Pdata_grow(Pdata *self)
217 int bigger;
218 size_t nbytes;
219 PyObject **tmp;
221 bigger = self->size << 1;
222 if (bigger <= 0) /* was 0, or new value overflows */
223 goto nomemory;
224 if ((int)(size_t)bigger != bigger)
225 goto nomemory;
226 nbytes = (size_t)bigger * sizeof(PyObject *);
227 if (nbytes / sizeof(PyObject *) != (size_t)bigger)
228 goto nomemory;
229 tmp = realloc(self->data, nbytes);
230 if (tmp == NULL)
231 goto nomemory;
232 self->data = tmp;
233 self->size = bigger;
234 return 0;
236 nomemory:
237 PyErr_NoMemory();
238 return -1;
241 /* D is a Pdata*. Pop the topmost element and store it into V, which
242 * must be an lvalue holding PyObject*. On stack underflow, UnpicklingError
243 * is raised and V is set to NULL. D and V may be evaluated several times.
245 #define PDATA_POP(D, V) { \
246 if ((D)->length) \
247 (V) = (D)->data[--((D)->length)]; \
248 else { \
249 PyErr_SetString(UnpicklingError, "bad pickle data"); \
250 (V) = NULL; \
254 /* PDATA_PUSH and PDATA_APPEND both push rvalue PyObject* O on to Pdata*
255 * D. If the Pdata stack can't be grown to hold the new value, both
256 * raise MemoryError and execute "return ER". The difference is in ownership
257 * of O after: _PUSH transfers ownership of O from the caller to the stack
258 * (no incref of O is done, and in case of error O is decrefed), while
259 * _APPEND pushes a new reference.
262 /* Push O on stack D, giving ownership of O to the stack. */
263 #define PDATA_PUSH(D, O, ER) { \
264 if (((Pdata*)(D))->length == ((Pdata*)(D))->size && \
265 Pdata_grow((Pdata*)(D)) < 0) { \
266 Py_DECREF(O); \
267 return ER; \
269 ((Pdata*)(D))->data[((Pdata*)(D))->length++] = (O); \
272 /* Push O on stack D, pushing a new reference. */
273 #define PDATA_APPEND(D, O, ER) { \
274 if (((Pdata*)(D))->length == ((Pdata*)(D))->size && \
275 Pdata_grow((Pdata*)(D)) < 0) \
276 return ER; \
277 Py_INCREF(O); \
278 ((Pdata*)(D))->data[((Pdata*)(D))->length++] = (O); \
282 static PyObject *
283 Pdata_popTuple(Pdata *self, int start)
285 PyObject *r;
286 int i, j, l;
288 l = self->length-start;
289 r = PyTuple_New(l);
290 if (r == NULL)
291 return NULL;
292 for (i = start, j = 0 ; j < l; i++, j++)
293 PyTuple_SET_ITEM(r, j, self->data[i]);
295 self->length = start;
296 return r;
299 static PyObject *
300 Pdata_popList(Pdata *self, int start)
302 PyObject *r;
303 int i, j, l;
305 l=self->length-start;
306 if (!( r=PyList_New(l))) return NULL;
307 for (i=start, j=0 ; j < l; i++, j++)
308 PyList_SET_ITEM(r, j, self->data[i]);
310 self->length=start;
311 return r;
314 /*************************************************************************/
316 #define ARG_TUP(self, o) { \
317 if (self->arg || (self->arg=PyTuple_New(1))) { \
318 Py_XDECREF(PyTuple_GET_ITEM(self->arg,0)); \
319 PyTuple_SET_ITEM(self->arg,0,o); \
321 else { \
322 Py_DECREF(o); \
326 #define FREE_ARG_TUP(self) { \
327 if (Py_REFCNT(self->arg) > 1) { \
328 Py_DECREF(self->arg); \
329 self->arg=NULL; \
333 typedef struct Picklerobject {
334 PyObject_HEAD
335 FILE *fp;
336 PyObject *write;
337 PyObject *file;
338 PyObject *memo;
339 PyObject *arg;
340 PyObject *pers_func;
341 PyObject *inst_pers_func;
343 /* pickle protocol number, >= 0 */
344 int proto;
346 /* bool, true if proto > 0 */
347 int bin;
349 int fast; /* Fast mode doesn't save in memo, don't use if circ ref */
350 int (*write_func)(struct Picklerobject *, const char *, Py_ssize_t);
351 char *write_buf;
352 int buf_size;
353 PyObject *dispatch_table;
354 int fast_container; /* count nested container dumps */
355 PyObject *fast_memo;
356 } Picklerobject;
358 #ifndef PY_CPICKLE_FAST_LIMIT
359 #define PY_CPICKLE_FAST_LIMIT 50
360 #endif
362 static PyTypeObject Picklertype;
364 typedef struct Unpicklerobject {
365 PyObject_HEAD
366 FILE *fp;
367 PyObject *file;
368 PyObject *readline;
369 PyObject *read;
370 PyObject *memo;
371 PyObject *arg;
372 Pdata *stack;
373 PyObject *mark;
374 PyObject *pers_func;
375 PyObject *last_string;
376 int *marks;
377 int num_marks;
378 int marks_size;
379 Py_ssize_t (*read_func)(struct Unpicklerobject *, char **, Py_ssize_t);
380 Py_ssize_t (*readline_func)(struct Unpicklerobject *, char **);
381 int buf_size;
382 char *buf;
383 PyObject *find_class;
384 } Unpicklerobject;
386 static PyTypeObject Unpicklertype;
388 /* Forward decls that need the above structs */
389 static int save(Picklerobject *, PyObject *, int);
390 static int put2(Picklerobject *, PyObject *);
392 static
393 PyObject *
394 cPickle_ErrFormat(PyObject *ErrType, char *stringformat, char *format, ...)
396 va_list va;
397 PyObject *args=0, *retval=0;
398 va_start(va, format);
400 if (format) args = Py_VaBuildValue(format, va);
401 va_end(va);
402 if (format && ! args) return NULL;
403 if (stringformat && !(retval=PyString_FromString(stringformat)))
404 return NULL;
406 if (retval) {
407 if (args) {
408 PyObject *v;
409 v=PyString_Format(retval, args);
410 Py_DECREF(retval);
411 Py_DECREF(args);
412 if (! v) return NULL;
413 retval=v;
416 else
417 if (args) retval=args;
418 else {
419 PyErr_SetObject(ErrType,Py_None);
420 return NULL;
422 PyErr_SetObject(ErrType,retval);
423 Py_DECREF(retval);
424 return NULL;
427 static int
428 write_file(Picklerobject *self, const char *s, Py_ssize_t n)
430 size_t nbyteswritten;
432 if (s == NULL) {
433 return 0;
436 if (n > INT_MAX) {
437 /* String too large */
438 return -1;
441 PyFile_IncUseCount((PyFileObject *)self->file);
442 Py_BEGIN_ALLOW_THREADS
443 nbyteswritten = fwrite(s, sizeof(char), n, self->fp);
444 Py_END_ALLOW_THREADS
445 PyFile_DecUseCount((PyFileObject *)self->file);
446 if (nbyteswritten != (size_t)n) {
447 PyErr_SetFromErrno(PyExc_IOError);
448 return -1;
451 return (int)n;
454 static int
455 write_cStringIO(Picklerobject *self, const char *s, Py_ssize_t n)
457 if (s == NULL) {
458 return 0;
461 if (PycStringIO->cwrite((PyObject *)self->file, s, n) != n) {
462 return -1;
465 return (int)n;
468 static int
469 write_none(Picklerobject *self, const char *s, Py_ssize_t n)
471 if (s == NULL) return 0;
472 if (n > INT_MAX) return -1;
473 return (int)n;
476 static int
477 write_other(Picklerobject *self, const char *s, Py_ssize_t _n)
479 PyObject *py_str = 0, *junk = 0;
480 int n;
482 if (_n > INT_MAX)
483 return -1;
484 n = (int)_n;
485 if (s == NULL) {
486 if (!( self->buf_size )) return 0;
487 py_str = PyString_FromStringAndSize(self->write_buf,
488 self->buf_size);
489 if (!py_str)
490 return -1;
492 else {
493 if (self->buf_size && (n + self->buf_size) > WRITE_BUF_SIZE) {
494 if (write_other(self, NULL, 0) < 0)
495 return -1;
498 if (n > WRITE_BUF_SIZE) {
499 if (!( py_str =
500 PyString_FromStringAndSize(s, n)))
501 return -1;
503 else {
504 memcpy(self->write_buf + self->buf_size, s, n);
505 self->buf_size += n;
506 return n;
510 if (self->write) {
511 /* object with write method */
512 ARG_TUP(self, py_str);
513 if (self->arg) {
514 junk = PyObject_Call(self->write, self->arg, NULL);
515 FREE_ARG_TUP(self);
517 if (junk) Py_DECREF(junk);
518 else return -1;
520 else
521 PDATA_PUSH(self->file, py_str, -1);
523 self->buf_size = 0;
524 return n;
528 static Py_ssize_t
529 read_file(Unpicklerobject *self, char **s, Py_ssize_t n)
531 size_t nbytesread;
533 if (self->buf_size == 0) {
534 int size;
536 size = ((n < 32) ? 32 : n);
537 if (!( self->buf = (char *)malloc(size))) {
538 PyErr_NoMemory();
539 return -1;
542 self->buf_size = size;
544 else if (n > self->buf_size) {
545 char *newbuf = (char *)realloc(self->buf, n);
546 if (!newbuf) {
547 PyErr_NoMemory();
548 return -1;
550 self->buf = newbuf;
551 self->buf_size = n;
554 PyFile_IncUseCount((PyFileObject *)self->file);
555 Py_BEGIN_ALLOW_THREADS
556 nbytesread = fread(self->buf, sizeof(char), n, self->fp);
557 Py_END_ALLOW_THREADS
558 PyFile_DecUseCount((PyFileObject *)self->file);
559 if (nbytesread != (size_t)n) {
560 if (feof(self->fp)) {
561 PyErr_SetNone(PyExc_EOFError);
562 return -1;
565 PyErr_SetFromErrno(PyExc_IOError);
566 return -1;
569 *s = self->buf;
571 return n;
575 static Py_ssize_t
576 readline_file(Unpicklerobject *self, char **s)
578 int i;
580 if (self->buf_size == 0) {
581 if (!( self->buf = (char *)malloc(40))) {
582 PyErr_NoMemory();
583 return -1;
585 self->buf_size = 40;
588 i = 0;
589 while (1) {
590 int bigger;
591 char *newbuf;
592 for (; i < (self->buf_size - 1); i++) {
593 if (feof(self->fp) ||
594 (self->buf[i] = getc(self->fp)) == '\n') {
595 self->buf[i + 1] = '\0';
596 *s = self->buf;
597 return i + 1;
600 bigger = self->buf_size << 1;
601 if (bigger <= 0) { /* overflow */
602 PyErr_NoMemory();
603 return -1;
605 newbuf = (char *)realloc(self->buf, bigger);
606 if (!newbuf) {
607 PyErr_NoMemory();
608 return -1;
610 self->buf = newbuf;
611 self->buf_size = bigger;
616 static Py_ssize_t
617 read_cStringIO(Unpicklerobject *self, char **s, Py_ssize_t n)
619 char *ptr;
621 if (PycStringIO->cread((PyObject *)self->file, &ptr, n) != n) {
622 PyErr_SetNone(PyExc_EOFError);
623 return -1;
626 *s = ptr;
628 return n;
632 static Py_ssize_t
633 readline_cStringIO(Unpicklerobject *self, char **s)
635 Py_ssize_t n;
636 char *ptr;
638 if ((n = PycStringIO->creadline((PyObject *)self->file, &ptr)) < 0) {
639 return -1;
642 *s = ptr;
644 return n;
648 static Py_ssize_t
649 read_other(Unpicklerobject *self, char **s, Py_ssize_t n)
651 PyObject *bytes, *str=0;
653 if (!( bytes = PyInt_FromSsize_t(n))) return -1;
655 ARG_TUP(self, bytes);
656 if (self->arg) {
657 str = PyObject_Call(self->read, self->arg, NULL);
658 FREE_ARG_TUP(self);
660 if (! str) return -1;
662 Py_XDECREF(self->last_string);
663 self->last_string = str;
665 if (! (*s = PyString_AsString(str))) return -1;
667 if (PyString_GET_SIZE(str) != n) {
668 PyErr_SetNone(PyExc_EOFError);
669 return -1;
672 return n;
676 static Py_ssize_t
677 readline_other(Unpicklerobject *self, char **s)
679 PyObject *str;
680 Py_ssize_t str_size;
682 if (!( str = PyObject_CallObject(self->readline, empty_tuple))) {
683 return -1;
686 if ((str_size = PyString_Size(str)) < 0)
687 return -1;
689 Py_XDECREF(self->last_string);
690 self->last_string = str;
692 if (! (*s = PyString_AsString(str)))
693 return -1;
695 return str_size;
698 /* Copy the first n bytes from s into newly malloc'ed memory, plus a
699 * trailing 0 byte. Return a pointer to that, or NULL if out of memory.
700 * The caller is responsible for free()'ing the return value.
702 static char *
703 pystrndup(const char *s, int n)
705 char *r = (char *)malloc(n+1);
706 if (r == NULL)
707 return (char*)PyErr_NoMemory();
708 memcpy(r, s, n);
709 r[n] = 0;
710 return r;
714 static int
715 get(Picklerobject *self, PyObject *id)
717 PyObject *value, *mv;
718 long c_value;
719 char s[30];
720 size_t len;
722 if (!( mv = PyDict_GetItem(self->memo, id))) {
723 PyErr_SetObject(PyExc_KeyError, id);
724 return -1;
727 if (!( value = PyTuple_GetItem(mv, 0)))
728 return -1;
730 if (!( PyInt_Check(value))) {
731 PyErr_SetString(PicklingError, "no int where int expected in memo");
732 return -1;
734 c_value = PyInt_AS_LONG((PyIntObject*)value);
736 if (!self->bin) {
737 s[0] = GET;
738 PyOS_snprintf(s + 1, sizeof(s) - 1, "%ld\n", c_value);
739 len = strlen(s);
741 else if (Pdata_Check(self->file)) {
742 if (write_other(self, NULL, 0) < 0) return -1;
743 PDATA_APPEND(self->file, mv, -1);
744 return 0;
746 else {
747 if (c_value < 256) {
748 s[0] = BINGET;
749 s[1] = (int)(c_value & 0xff);
750 len = 2;
752 else {
753 s[0] = LONG_BINGET;
754 s[1] = (int)(c_value & 0xff);
755 s[2] = (int)((c_value >> 8) & 0xff);
756 s[3] = (int)((c_value >> 16) & 0xff);
757 s[4] = (int)((c_value >> 24) & 0xff);
758 len = 5;
762 if (self->write_func(self, s, len) < 0)
763 return -1;
765 return 0;
769 static int
770 put(Picklerobject *self, PyObject *ob)
772 if (Py_REFCNT(ob) < 2 || self->fast)
773 return 0;
775 return put2(self, ob);
779 static int
780 put2(Picklerobject *self, PyObject *ob)
782 char c_str[30];
783 int p;
784 size_t len;
785 int res = -1;
786 PyObject *py_ob_id = 0, *memo_len = 0, *t = 0;
788 if (self->fast)
789 return 0;
791 if ((p = PyDict_Size(self->memo)) < 0)
792 goto finally;
794 /* Make sure memo keys are positive! */
795 /* XXX Why?
796 * XXX And does "positive" really mean non-negative?
797 * XXX pickle.py starts with PUT index 0, not 1. This makes for
798 * XXX gratuitous differences between the pickling modules.
800 p++;
802 if (!( py_ob_id = PyLong_FromVoidPtr(ob)))
803 goto finally;
805 if (!( memo_len = PyInt_FromLong(p)))
806 goto finally;
808 if (!( t = PyTuple_New(2)))
809 goto finally;
811 PyTuple_SET_ITEM(t, 0, memo_len);
812 Py_INCREF(memo_len);
813 PyTuple_SET_ITEM(t, 1, ob);
814 Py_INCREF(ob);
816 if (PyDict_SetItem(self->memo, py_ob_id, t) < 0)
817 goto finally;
819 if (!self->bin) {
820 c_str[0] = PUT;
821 PyOS_snprintf(c_str + 1, sizeof(c_str) - 1, "%d\n", p);
822 len = strlen(c_str);
824 else if (Pdata_Check(self->file)) {
825 if (write_other(self, NULL, 0) < 0) return -1;
826 PDATA_APPEND(self->file, memo_len, -1);
827 res=0; /* Job well done ;) */
828 goto finally;
830 else {
831 if (p >= 256) {
832 c_str[0] = LONG_BINPUT;
833 c_str[1] = (int)(p & 0xff);
834 c_str[2] = (int)((p >> 8) & 0xff);
835 c_str[3] = (int)((p >> 16) & 0xff);
836 c_str[4] = (int)((p >> 24) & 0xff);
837 len = 5;
839 else {
840 c_str[0] = BINPUT;
841 c_str[1] = p;
842 len = 2;
846 if (self->write_func(self, c_str, len) < 0)
847 goto finally;
849 res = 0;
851 finally:
852 Py_XDECREF(py_ob_id);
853 Py_XDECREF(memo_len);
854 Py_XDECREF(t);
856 return res;
859 static PyObject *
860 whichmodule(PyObject *global, PyObject *global_name)
862 Py_ssize_t i, j;
863 PyObject *module = 0, *modules_dict = 0,
864 *global_name_attr = 0, *name = 0;
866 module = PyObject_GetAttrString(global, "__module__");
867 if (module)
868 return module;
869 if (PyErr_ExceptionMatches(PyExc_AttributeError))
870 PyErr_Clear();
871 else
872 return NULL;
874 if (!( modules_dict = PySys_GetObject("modules")))
875 return NULL;
877 i = 0;
878 while ((j = PyDict_Next(modules_dict, &i, &name, &module))) {
880 if (PyObject_Compare(name, __main___str)==0) continue;
882 global_name_attr = PyObject_GetAttr(module, global_name);
883 if (!global_name_attr) {
884 if (PyErr_ExceptionMatches(PyExc_AttributeError))
885 PyErr_Clear();
886 else
887 return NULL;
888 continue;
891 if (global_name_attr != global) {
892 Py_DECREF(global_name_attr);
893 continue;
896 Py_DECREF(global_name_attr);
898 break;
901 /* The following implements the rule in pickle.py added in 1.5
902 that used __main__ if no module is found. I don't actually
903 like this rule. jlf
905 if (!j) {
906 name=__main___str;
909 Py_INCREF(name);
910 return name;
914 static int
915 fast_save_enter(Picklerobject *self, PyObject *obj)
917 /* if fast_container < 0, we're doing an error exit. */
918 if (++self->fast_container >= PY_CPICKLE_FAST_LIMIT) {
919 PyObject *key = NULL;
920 if (self->fast_memo == NULL) {
921 self->fast_memo = PyDict_New();
922 if (self->fast_memo == NULL) {
923 self->fast_container = -1;
924 return 0;
927 key = PyLong_FromVoidPtr(obj);
928 if (key == NULL)
929 return 0;
930 if (PyDict_GetItem(self->fast_memo, key)) {
931 Py_DECREF(key);
932 PyErr_Format(PyExc_ValueError,
933 "fast mode: can't pickle cyclic objects "
934 "including object type %s at %p",
935 Py_TYPE(obj)->tp_name, obj);
936 self->fast_container = -1;
937 return 0;
939 if (PyDict_SetItem(self->fast_memo, key, Py_None) < 0) {
940 Py_DECREF(key);
941 self->fast_container = -1;
942 return 0;
944 Py_DECREF(key);
946 return 1;
950 fast_save_leave(Picklerobject *self, PyObject *obj)
952 if (self->fast_container-- >= PY_CPICKLE_FAST_LIMIT) {
953 PyObject *key = PyLong_FromVoidPtr(obj);
954 if (key == NULL)
955 return 0;
956 if (PyDict_DelItem(self->fast_memo, key) < 0) {
957 Py_DECREF(key);
958 return 0;
960 Py_DECREF(key);
962 return 1;
965 static int
966 save_none(Picklerobject *self, PyObject *args)
968 static char none = NONE;
969 if (self->write_func(self, &none, 1) < 0)
970 return -1;
972 return 0;
975 static int
976 save_bool(Picklerobject *self, PyObject *args)
978 static const char *buf[2] = {FALSE, TRUE};
979 static char len[2] = {sizeof(FALSE)-1, sizeof(TRUE)-1};
980 long l = PyInt_AS_LONG((PyIntObject *)args);
982 if (self->proto >= 2) {
983 char opcode = l ? NEWTRUE : NEWFALSE;
984 if (self->write_func(self, &opcode, 1) < 0)
985 return -1;
987 else if (self->write_func(self, buf[l], len[l]) < 0)
988 return -1;
989 return 0;
992 static int
993 save_int(Picklerobject *self, PyObject *args)
995 char c_str[32];
996 long l = PyInt_AS_LONG((PyIntObject *)args);
997 int len = 0;
999 if (!self->bin
1000 #if SIZEOF_LONG > 4
1001 || l > 0x7fffffffL
1002 || l < -0x80000000L
1003 #endif
1005 /* Text-mode pickle, or long too big to fit in the 4-byte
1006 * signed BININT format: store as a string.
1008 c_str[0] = INT;
1009 PyOS_snprintf(c_str + 1, sizeof(c_str) - 1, "%ld\n", l);
1010 if (self->write_func(self, c_str, strlen(c_str)) < 0)
1011 return -1;
1013 else {
1014 /* Binary pickle and l fits in a signed 4-byte int. */
1015 c_str[1] = (int)( l & 0xff);
1016 c_str[2] = (int)((l >> 8) & 0xff);
1017 c_str[3] = (int)((l >> 16) & 0xff);
1018 c_str[4] = (int)((l >> 24) & 0xff);
1020 if ((c_str[4] == 0) && (c_str[3] == 0)) {
1021 if (c_str[2] == 0) {
1022 c_str[0] = BININT1;
1023 len = 2;
1025 else {
1026 c_str[0] = BININT2;
1027 len = 3;
1030 else {
1031 c_str[0] = BININT;
1032 len = 5;
1035 if (self->write_func(self, c_str, len) < 0)
1036 return -1;
1039 return 0;
1043 static int
1044 save_long(Picklerobject *self, PyObject *args)
1046 Py_ssize_t size;
1047 int res = -1;
1048 PyObject *repr = NULL;
1050 static char l = LONG;
1052 if (self->proto >= 2) {
1053 /* Linear-time pickling. */
1054 size_t nbits;
1055 size_t nbytes;
1056 unsigned char *pdata;
1057 char c_str[5];
1058 int i;
1059 int sign = _PyLong_Sign(args);
1061 if (sign == 0) {
1062 /* It's 0 -- an empty bytestring. */
1063 c_str[0] = LONG1;
1064 c_str[1] = 0;
1065 i = self->write_func(self, c_str, 2);
1066 if (i < 0) goto finally;
1067 res = 0;
1068 goto finally;
1070 nbits = _PyLong_NumBits(args);
1071 if (nbits == (size_t)-1 && PyErr_Occurred())
1072 goto finally;
1073 /* How many bytes do we need? There are nbits >> 3 full
1074 * bytes of data, and nbits & 7 leftover bits. If there
1075 * are any leftover bits, then we clearly need another
1076 * byte. Wnat's not so obvious is that we *probably*
1077 * need another byte even if there aren't any leftovers:
1078 * the most-significant bit of the most-significant byte
1079 * acts like a sign bit, and it's usually got a sense
1080 * opposite of the one we need. The exception is longs
1081 * of the form -(2**(8*j-1)) for j > 0. Such a long is
1082 * its own 256's-complement, so has the right sign bit
1083 * even without the extra byte. That's a pain to check
1084 * for in advance, though, so we always grab an extra
1085 * byte at the start, and cut it back later if possible.
1087 nbytes = (nbits >> 3) + 1;
1088 if (nbytes > INT_MAX) {
1089 PyErr_SetString(PyExc_OverflowError, "long too large "
1090 "to pickle");
1091 goto finally;
1093 repr = PyString_FromStringAndSize(NULL, (int)nbytes);
1094 if (repr == NULL) goto finally;
1095 pdata = (unsigned char *)PyString_AS_STRING(repr);
1096 i = _PyLong_AsByteArray((PyLongObject *)args,
1097 pdata, nbytes,
1098 1 /* little endian */, 1 /* signed */);
1099 if (i < 0) goto finally;
1100 /* If the long is negative, this may be a byte more than
1101 * needed. This is so iff the MSB is all redundant sign
1102 * bits.
1104 if (sign < 0 && nbytes > 1 && pdata[nbytes - 1] == 0xff &&
1105 (pdata[nbytes - 2] & 0x80) != 0)
1106 --nbytes;
1108 if (nbytes < 256) {
1109 c_str[0] = LONG1;
1110 c_str[1] = (char)nbytes;
1111 size = 2;
1113 else {
1114 c_str[0] = LONG4;
1115 size = (int)nbytes;
1116 for (i = 1; i < 5; i++) {
1117 c_str[i] = (char)(size & 0xff);
1118 size >>= 8;
1120 size = 5;
1122 i = self->write_func(self, c_str, size);
1123 if (i < 0) goto finally;
1124 i = self->write_func(self, (char *)pdata, (int)nbytes);
1125 if (i < 0) goto finally;
1126 res = 0;
1127 goto finally;
1130 /* proto < 2: write the repr and newline. This is quadratic-time
1131 * (in the number of digits), in both directions.
1133 if (!( repr = PyObject_Repr(args)))
1134 goto finally;
1136 if ((size = PyString_Size(repr)) < 0)
1137 goto finally;
1139 if (self->write_func(self, &l, 1) < 0)
1140 goto finally;
1142 if (self->write_func(self,
1143 PyString_AS_STRING((PyStringObject *)repr),
1144 size) < 0)
1145 goto finally;
1147 if (self->write_func(self, "\n", 1) < 0)
1148 goto finally;
1150 res = 0;
1152 finally:
1153 Py_XDECREF(repr);
1154 return res;
1158 static int
1159 save_float(Picklerobject *self, PyObject *args)
1161 double x = PyFloat_AS_DOUBLE((PyFloatObject *)args);
1163 if (self->bin) {
1164 char str[9];
1165 str[0] = BINFLOAT;
1166 if (_PyFloat_Pack8(x, (unsigned char *)&str[1], 0) < 0)
1167 return -1;
1168 if (self->write_func(self, str, 9) < 0)
1169 return -1;
1171 else {
1172 int result = -1;
1173 char *buf = NULL;
1174 char op = FLOAT;
1176 if (self->write_func(self, &op, 1) < 0)
1177 goto done;
1179 buf = PyOS_double_to_string(x, 'g', 17, 0, NULL);
1180 if (!buf) {
1181 PyErr_NoMemory();
1182 goto done;
1185 if (self->write_func(self, buf, strlen(buf)) < 0)
1186 goto done;
1188 if (self->write_func(self, "\n", 1) < 0)
1189 goto done;
1191 result = 0;
1192 done:
1193 PyMem_Free(buf);
1194 return result;
1197 return 0;
1201 static int
1202 save_string(Picklerobject *self, PyObject *args, int doput)
1204 int size, len;
1205 PyObject *repr=0;
1207 if ((size = PyString_Size(args)) < 0)
1208 return -1;
1210 if (!self->bin) {
1211 char *repr_str;
1213 static char string = STRING;
1215 if (!( repr = PyObject_Repr(args)))
1216 return -1;
1218 if ((len = PyString_Size(repr)) < 0)
1219 goto err;
1220 repr_str = PyString_AS_STRING((PyStringObject *)repr);
1222 if (self->write_func(self, &string, 1) < 0)
1223 goto err;
1225 if (self->write_func(self, repr_str, len) < 0)
1226 goto err;
1228 if (self->write_func(self, "\n", 1) < 0)
1229 goto err;
1231 Py_XDECREF(repr);
1233 else {
1234 int i;
1235 char c_str[5];
1237 if (size < 256) {
1238 c_str[0] = SHORT_BINSTRING;
1239 c_str[1] = size;
1240 len = 2;
1242 else if (size <= INT_MAX) {
1243 c_str[0] = BINSTRING;
1244 for (i = 1; i < 5; i++)
1245 c_str[i] = (int)(size >> ((i - 1) * 8));
1246 len = 5;
1248 else
1249 return -1; /* string too large */
1251 if (self->write_func(self, c_str, len) < 0)
1252 return -1;
1254 if (size > 128 && Pdata_Check(self->file)) {
1255 if (write_other(self, NULL, 0) < 0) return -1;
1256 PDATA_APPEND(self->file, args, -1);
1258 else {
1259 if (self->write_func(self,
1260 PyString_AS_STRING(
1261 (PyStringObject *)args),
1262 size) < 0)
1263 return -1;
1267 if (doput)
1268 if (put(self, args) < 0)
1269 return -1;
1271 return 0;
1273 err:
1274 Py_XDECREF(repr);
1275 return -1;
1279 #ifdef Py_USING_UNICODE
1280 /* A copy of PyUnicode_EncodeRawUnicodeEscape() that also translates
1281 backslash and newline characters to \uXXXX escapes. */
1282 static PyObject *
1283 modified_EncodeRawUnicodeEscape(const Py_UNICODE *s, Py_ssize_t size)
1285 PyObject *repr;
1286 char *p;
1287 char *q;
1289 static const char *hexdigit = "0123456789abcdef";
1290 #ifdef Py_UNICODE_WIDE
1291 const Py_ssize_t expandsize = 10;
1292 #else
1293 const Py_ssize_t expandsize = 6;
1294 #endif
1296 if (size > PY_SSIZE_T_MAX / expandsize)
1297 return PyErr_NoMemory();
1299 repr = PyString_FromStringAndSize(NULL, expandsize * size);
1300 if (repr == NULL)
1301 return NULL;
1302 if (size == 0)
1303 return repr;
1305 p = q = PyString_AS_STRING(repr);
1306 while (size-- > 0) {
1307 Py_UNICODE ch = *s++;
1308 #ifdef Py_UNICODE_WIDE
1309 /* Map 32-bit characters to '\Uxxxxxxxx' */
1310 if (ch >= 0x10000) {
1311 *p++ = '\\';
1312 *p++ = 'U';
1313 *p++ = hexdigit[(ch >> 28) & 0xf];
1314 *p++ = hexdigit[(ch >> 24) & 0xf];
1315 *p++ = hexdigit[(ch >> 20) & 0xf];
1316 *p++ = hexdigit[(ch >> 16) & 0xf];
1317 *p++ = hexdigit[(ch >> 12) & 0xf];
1318 *p++ = hexdigit[(ch >> 8) & 0xf];
1319 *p++ = hexdigit[(ch >> 4) & 0xf];
1320 *p++ = hexdigit[ch & 15];
1322 else
1323 #else
1324 /* Map UTF-16 surrogate pairs to '\U00xxxxxx' */
1325 if (ch >= 0xD800 && ch < 0xDC00) {
1326 Py_UNICODE ch2;
1327 Py_UCS4 ucs;
1329 ch2 = *s++;
1330 size--;
1331 if (ch2 >= 0xDC00 && ch2 <= 0xDFFF) {
1332 ucs = (((ch & 0x03FF) << 10) | (ch2 & 0x03FF)) + 0x00010000;
1333 *p++ = '\\';
1334 *p++ = 'U';
1335 *p++ = hexdigit[(ucs >> 28) & 0xf];
1336 *p++ = hexdigit[(ucs >> 24) & 0xf];
1337 *p++ = hexdigit[(ucs >> 20) & 0xf];
1338 *p++ = hexdigit[(ucs >> 16) & 0xf];
1339 *p++ = hexdigit[(ucs >> 12) & 0xf];
1340 *p++ = hexdigit[(ucs >> 8) & 0xf];
1341 *p++ = hexdigit[(ucs >> 4) & 0xf];
1342 *p++ = hexdigit[ucs & 0xf];
1343 continue;
1345 /* Fall through: isolated surrogates are copied as-is */
1346 s--;
1347 size++;
1349 #endif
1350 /* Map 16-bit characters to '\uxxxx' */
1351 if (ch >= 256 || ch == '\\' || ch == '\n') {
1352 *p++ = '\\';
1353 *p++ = 'u';
1354 *p++ = hexdigit[(ch >> 12) & 0xf];
1355 *p++ = hexdigit[(ch >> 8) & 0xf];
1356 *p++ = hexdigit[(ch >> 4) & 0xf];
1357 *p++ = hexdigit[ch & 15];
1359 /* Copy everything else as-is */
1360 else
1361 *p++ = (char) ch;
1363 *p = '\0';
1364 _PyString_Resize(&repr, p - q);
1365 return repr;
1368 static int
1369 save_unicode(Picklerobject *self, PyObject *args, int doput)
1371 Py_ssize_t size, len;
1372 PyObject *repr=0;
1374 if (!PyUnicode_Check(args))
1375 return -1;
1377 if (!self->bin) {
1378 char *repr_str;
1379 static char string = UNICODE;
1381 repr = modified_EncodeRawUnicodeEscape(
1382 PyUnicode_AS_UNICODE(args), PyUnicode_GET_SIZE(args));
1383 if (!repr)
1384 return -1;
1386 if ((len = PyString_Size(repr)) < 0)
1387 goto err;
1388 repr_str = PyString_AS_STRING((PyStringObject *)repr);
1390 if (self->write_func(self, &string, 1) < 0)
1391 goto err;
1393 if (self->write_func(self, repr_str, len) < 0)
1394 goto err;
1396 if (self->write_func(self, "\n", 1) < 0)
1397 goto err;
1399 Py_XDECREF(repr);
1401 else {
1402 int i;
1403 char c_str[5];
1405 if (!( repr = PyUnicode_AsUTF8String(args)))
1406 return -1;
1408 if ((size = PyString_Size(repr)) < 0)
1409 goto err;
1410 if (size > INT_MAX)
1411 return -1; /* string too large */
1413 c_str[0] = BINUNICODE;
1414 for (i = 1; i < 5; i++)
1415 c_str[i] = (int)(size >> ((i - 1) * 8));
1416 len = 5;
1418 if (self->write_func(self, c_str, len) < 0)
1419 goto err;
1421 if (size > 128 && Pdata_Check(self->file)) {
1422 if (write_other(self, NULL, 0) < 0)
1423 goto err;
1424 PDATA_APPEND(self->file, repr, -1);
1426 else {
1427 if (self->write_func(self, PyString_AS_STRING(repr),
1428 size) < 0)
1429 goto err;
1432 Py_DECREF(repr);
1435 if (doput)
1436 if (put(self, args) < 0)
1437 return -1;
1439 return 0;
1441 err:
1442 Py_XDECREF(repr);
1443 return -1;
1445 #endif
1447 /* A helper for save_tuple. Push the len elements in tuple t on the stack. */
1448 static int
1449 store_tuple_elements(Picklerobject *self, PyObject *t, int len)
1451 int i;
1452 int res = -1; /* guilty until proved innocent */
1454 assert(PyTuple_Size(t) == len);
1456 for (i = 0; i < len; i++) {
1457 PyObject *element = PyTuple_GET_ITEM(t, i);
1459 if (element == NULL)
1460 goto finally;
1461 if (save(self, element, 0) < 0)
1462 goto finally;
1464 res = 0;
1466 finally:
1467 return res;
1470 /* Tuples are ubiquitous in the pickle protocols, so many techniques are
1471 * used across protocols to minimize the space needed to pickle them.
1472 * Tuples are also the only builtin immutable type that can be recursive
1473 * (a tuple can be reached from itself), and that requires some subtle
1474 * magic so that it works in all cases. IOW, this is a long routine.
1476 static int
1477 save_tuple(Picklerobject *self, PyObject *args)
1479 PyObject *py_tuple_id = NULL;
1480 int len, i;
1481 int res = -1;
1483 static char tuple = TUPLE;
1484 static char pop = POP;
1485 static char pop_mark = POP_MARK;
1486 static char len2opcode[] = {EMPTY_TUPLE, TUPLE1, TUPLE2, TUPLE3};
1488 if ((len = PyTuple_Size(args)) < 0)
1489 goto finally;
1491 if (len == 0) {
1492 char c_str[2];
1494 if (self->proto) {
1495 c_str[0] = EMPTY_TUPLE;
1496 len = 1;
1498 else {
1499 c_str[0] = MARK;
1500 c_str[1] = TUPLE;
1501 len = 2;
1503 if (self->write_func(self, c_str, len) >= 0)
1504 res = 0;
1505 /* Don't memoize an empty tuple. */
1506 goto finally;
1509 /* A non-empty tuple. */
1511 /* id(tuple) isn't in the memo now. If it shows up there after
1512 * saving the tuple elements, the tuple must be recursive, in
1513 * which case we'll pop everything we put on the stack, and fetch
1514 * its value from the memo.
1516 py_tuple_id = PyLong_FromVoidPtr(args);
1517 if (py_tuple_id == NULL)
1518 goto finally;
1520 if (len <= 3 && self->proto >= 2) {
1521 /* Use TUPLE{1,2,3} opcodes. */
1522 if (store_tuple_elements(self, args, len) < 0)
1523 goto finally;
1524 if (PyDict_GetItem(self->memo, py_tuple_id)) {
1525 /* pop the len elements */
1526 for (i = 0; i < len; ++i)
1527 if (self->write_func(self, &pop, 1) < 0)
1528 goto finally;
1529 /* fetch from memo */
1530 if (get(self, py_tuple_id) < 0)
1531 goto finally;
1532 res = 0;
1533 goto finally;
1535 /* Not recursive. */
1536 if (self->write_func(self, len2opcode + len, 1) < 0)
1537 goto finally;
1538 goto memoize;
1541 /* proto < 2 and len > 0, or proto >= 2 and len > 3.
1542 * Generate MARK elt1 elt2 ... TUPLE
1544 if (self->write_func(self, &MARKv, 1) < 0)
1545 goto finally;
1547 if (store_tuple_elements(self, args, len) < 0)
1548 goto finally;
1550 if (PyDict_GetItem(self->memo, py_tuple_id)) {
1551 /* pop the stack stuff we pushed */
1552 if (self->bin) {
1553 if (self->write_func(self, &pop_mark, 1) < 0)
1554 goto finally;
1556 else {
1557 /* Note that we pop one more than len, to remove
1558 * the MARK too.
1560 for (i = 0; i <= len; i++)
1561 if (self->write_func(self, &pop, 1) < 0)
1562 goto finally;
1564 /* fetch from memo */
1565 if (get(self, py_tuple_id) >= 0)
1566 res = 0;
1567 goto finally;
1570 /* Not recursive. */
1571 if (self->write_func(self, &tuple, 1) < 0)
1572 goto finally;
1574 memoize:
1575 if (put(self, args) >= 0)
1576 res = 0;
1578 finally:
1579 Py_XDECREF(py_tuple_id);
1580 return res;
1583 /* iter is an iterator giving items, and we batch up chunks of
1584 * MARK item item ... item APPENDS
1585 * opcode sequences. Calling code should have arranged to first create an
1586 * empty list, or list-like object, for the APPENDS to operate on.
1587 * Returns 0 on success, <0 on error.
1589 static int
1590 batch_list(Picklerobject *self, PyObject *iter)
1592 PyObject *obj = NULL;
1593 PyObject *firstitem = NULL;
1594 int i, n;
1596 static char append = APPEND;
1597 static char appends = APPENDS;
1599 assert(iter != NULL);
1601 if (self->proto == 0) {
1602 /* APPENDS isn't available; do one at a time. */
1603 for (;;) {
1604 obj = PyIter_Next(iter);
1605 if (obj == NULL) {
1606 if (PyErr_Occurred())
1607 return -1;
1608 break;
1610 i = save(self, obj, 0);
1611 Py_DECREF(obj);
1612 if (i < 0)
1613 return -1;
1614 if (self->write_func(self, &append, 1) < 0)
1615 return -1;
1617 return 0;
1620 /* proto > 0: write in batches of BATCHSIZE. */
1621 do {
1622 /* Get first item */
1623 firstitem = PyIter_Next(iter);
1624 if (firstitem == NULL) {
1625 if (PyErr_Occurred())
1626 goto BatchFailed;
1628 /* nothing more to add */
1629 break;
1632 /* Try to get a second item */
1633 obj = PyIter_Next(iter);
1634 if (obj == NULL) {
1635 if (PyErr_Occurred())
1636 goto BatchFailed;
1638 /* Only one item to write */
1639 if (save(self, firstitem, 0) < 0)
1640 goto BatchFailed;
1641 if (self->write_func(self, &append, 1) < 0)
1642 goto BatchFailed;
1643 Py_CLEAR(firstitem);
1644 break;
1647 /* More than one item to write */
1649 /* Pump out MARK, items, APPENDS. */
1650 if (self->write_func(self, &MARKv, 1) < 0)
1651 goto BatchFailed;
1653 if (save(self, firstitem, 0) < 0)
1654 goto BatchFailed;
1655 Py_CLEAR(firstitem);
1656 n = 1;
1658 /* Fetch and save up to BATCHSIZE items */
1659 while (obj) {
1660 if (save(self, obj, 0) < 0)
1661 goto BatchFailed;
1662 Py_CLEAR(obj);
1663 n += 1;
1665 if (n == BATCHSIZE)
1666 break;
1668 obj = PyIter_Next(iter);
1669 if (obj == NULL) {
1670 if (PyErr_Occurred())
1671 goto BatchFailed;
1672 break;
1676 if (self->write_func(self, &appends, 1) < 0)
1677 goto BatchFailed;
1679 } while (n == BATCHSIZE);
1680 return 0;
1682 BatchFailed:
1683 Py_XDECREF(firstitem);
1684 Py_XDECREF(obj);
1685 return -1;
1688 static int
1689 save_list(Picklerobject *self, PyObject *args)
1691 int res = -1;
1692 char s[3];
1693 int len;
1694 PyObject *iter;
1696 if (self->fast && !fast_save_enter(self, args))
1697 goto finally;
1699 /* Create an empty list. */
1700 if (self->bin) {
1701 s[0] = EMPTY_LIST;
1702 len = 1;
1704 else {
1705 s[0] = MARK;
1706 s[1] = LIST;
1707 len = 2;
1710 if (self->write_func(self, s, len) < 0)
1711 goto finally;
1713 /* Get list length, and bow out early if empty. */
1714 if ((len = PyList_Size(args)) < 0)
1715 goto finally;
1717 /* Memoize. */
1718 if (len == 0) {
1719 if (put(self, args) >= 0)
1720 res = 0;
1721 goto finally;
1723 if (put2(self, args) < 0)
1724 goto finally;
1726 /* Materialize the list elements. */
1727 iter = PyObject_GetIter(args);
1728 if (iter == NULL)
1729 goto finally;
1731 if (Py_EnterRecursiveCall(" while pickling an object") == 0)
1733 res = batch_list(self, iter);
1734 Py_LeaveRecursiveCall();
1736 Py_DECREF(iter);
1738 finally:
1739 if (self->fast && !fast_save_leave(self, args))
1740 res = -1;
1742 return res;
1746 /* iter is an iterator giving (key, value) pairs, and we batch up chunks of
1747 * MARK key value ... key value SETITEMS
1748 * opcode sequences. Calling code should have arranged to first create an
1749 * empty dict, or dict-like object, for the SETITEMS to operate on.
1750 * Returns 0 on success, <0 on error.
1752 * This is very much like batch_list(). The difference between saving
1753 * elements directly, and picking apart two-tuples, is so long-winded at
1754 * the C level, though, that attempts to combine these routines were too
1755 * ugly to bear.
1757 static int
1758 batch_dict(Picklerobject *self, PyObject *iter)
1760 PyObject *p = NULL;
1761 PyObject *firstitem = NULL;
1762 int i, n;
1764 static char setitem = SETITEM;
1765 static char setitems = SETITEMS;
1767 assert(iter != NULL);
1769 if (self->proto == 0) {
1770 /* SETITEMS isn't available; do one at a time. */
1771 for (;;) {
1772 p = PyIter_Next(iter);
1773 if (p == NULL) {
1774 if (PyErr_Occurred())
1775 return -1;
1776 break;
1778 if (!PyTuple_Check(p) || PyTuple_Size(p) != 2) {
1779 PyErr_SetString(PyExc_TypeError, "dict items "
1780 "iterator must return 2-tuples");
1781 return -1;
1783 i = save(self, PyTuple_GET_ITEM(p, 0), 0);
1784 if (i >= 0)
1785 i = save(self, PyTuple_GET_ITEM(p, 1), 0);
1786 Py_DECREF(p);
1787 if (i < 0)
1788 return -1;
1789 if (self->write_func(self, &setitem, 1) < 0)
1790 return -1;
1792 return 0;
1795 /* proto > 0: write in batches of BATCHSIZE. */
1796 do {
1797 /* Get first item */
1798 firstitem = PyIter_Next(iter);
1799 if (firstitem == NULL) {
1800 if (PyErr_Occurred())
1801 goto BatchFailed;
1803 /* nothing more to add */
1804 break;
1806 if (!PyTuple_Check(firstitem) || PyTuple_Size(firstitem) != 2) {
1807 PyErr_SetString(PyExc_TypeError, "dict items "
1808 "iterator must return 2-tuples");
1809 goto BatchFailed;
1812 /* Try to get a second item */
1813 p = PyIter_Next(iter);
1814 if (p == NULL) {
1815 if (PyErr_Occurred())
1816 goto BatchFailed;
1818 /* Only one item to write */
1819 if (save(self, PyTuple_GET_ITEM(firstitem, 0), 0) < 0)
1820 goto BatchFailed;
1821 if (save(self, PyTuple_GET_ITEM(firstitem, 1), 0) < 0)
1822 goto BatchFailed;
1823 if (self->write_func(self, &setitem, 1) < 0)
1824 goto BatchFailed;
1825 Py_CLEAR(firstitem);
1826 break;
1829 /* More than one item to write */
1831 /* Pump out MARK, items, SETITEMS. */
1832 if (self->write_func(self, &MARKv, 1) < 0)
1833 goto BatchFailed;
1835 if (save(self, PyTuple_GET_ITEM(firstitem, 0), 0) < 0)
1836 goto BatchFailed;
1837 if (save(self, PyTuple_GET_ITEM(firstitem, 1), 0) < 0)
1838 goto BatchFailed;
1839 Py_CLEAR(firstitem);
1840 n = 1;
1842 /* Fetch and save up to BATCHSIZE items */
1843 while (p) {
1844 if (!PyTuple_Check(p) || PyTuple_Size(p) != 2) {
1845 PyErr_SetString(PyExc_TypeError, "dict items "
1846 "iterator must return 2-tuples");
1847 goto BatchFailed;
1849 if (save(self, PyTuple_GET_ITEM(p, 0), 0) < 0)
1850 goto BatchFailed;
1851 if (save(self, PyTuple_GET_ITEM(p, 1), 0) < 0)
1852 goto BatchFailed;
1853 Py_CLEAR(p);
1854 n += 1;
1856 if (n == BATCHSIZE)
1857 break;
1859 p = PyIter_Next(iter);
1860 if (p == NULL) {
1861 if (PyErr_Occurred())
1862 goto BatchFailed;
1863 break;
1867 if (self->write_func(self, &setitems, 1) < 0)
1868 goto BatchFailed;
1870 } while (n == BATCHSIZE);
1871 return 0;
1873 BatchFailed:
1874 Py_XDECREF(firstitem);
1875 Py_XDECREF(p);
1876 return -1;
1879 /* This is a variant of batch_dict() above that specializes for dicts, with no
1880 * support for dict subclasses. Like batch_dict(), we batch up chunks of
1881 * MARK key value ... key value SETITEMS
1882 * opcode sequences. Calling code should have arranged to first create an
1883 * empty dict, or dict-like object, for the SETITEMS to operate on.
1884 * Returns 0 on success, -1 on error.
1886 * Note that this currently doesn't work for protocol 0.
1888 static int
1889 batch_dict_exact(Picklerobject *self, PyObject *obj)
1891 PyObject *key = NULL, *value = NULL;
1892 int i;
1893 Py_ssize_t dict_size, ppos = 0;
1895 static char setitem = SETITEM;
1896 static char setitems = SETITEMS;
1898 assert(obj != NULL);
1899 assert(self->proto > 0);
1901 dict_size = PyDict_Size(obj);
1903 /* Special-case len(d) == 1 to save space. */
1904 if (dict_size == 1) {
1905 PyDict_Next(obj, &ppos, &key, &value);
1906 if (save(self, key, 0) < 0)
1907 return -1;
1908 if (save(self, value, 0) < 0)
1909 return -1;
1910 if (self->write_func(self, &setitem, 1) < 0)
1911 return -1;
1912 return 0;
1915 /* Write in batches of BATCHSIZE. */
1916 do {
1917 i = 0;
1918 if (self->write_func(self, &MARKv, 1) < 0)
1919 return -1;
1920 while (PyDict_Next(obj, &ppos, &key, &value)) {
1921 if (save(self, key, 0) < 0)
1922 return -1;
1923 if (save(self, value, 0) < 0)
1924 return -1;
1925 if (++i == BATCHSIZE)
1926 break;
1928 if (self->write_func(self, &setitems, 1) < 0)
1929 return -1;
1930 if (PyDict_Size(obj) != dict_size) {
1931 PyErr_Format(
1932 PyExc_RuntimeError,
1933 "dictionary changed size during iteration");
1934 return -1;
1937 } while (i == BATCHSIZE);
1938 return 0;
1941 static int
1942 save_dict(Picklerobject *self, PyObject *args)
1944 int res = -1;
1945 char s[3];
1946 int len;
1948 if (self->fast && !fast_save_enter(self, args))
1949 goto finally;
1951 /* Create an empty dict. */
1952 if (self->bin) {
1953 s[0] = EMPTY_DICT;
1954 len = 1;
1956 else {
1957 s[0] = MARK;
1958 s[1] = DICT;
1959 len = 2;
1962 if (self->write_func(self, s, len) < 0)
1963 goto finally;
1965 /* Get dict size, and bow out early if empty. */
1966 if ((len = PyDict_Size(args)) < 0)
1967 goto finally;
1969 if (len == 0) {
1970 if (put(self, args) >= 0)
1971 res = 0;
1972 goto finally;
1974 if (put2(self, args) < 0)
1975 goto finally;
1977 /* Materialize the dict items. */
1978 if (PyDict_CheckExact(args) && self->proto > 0) {
1979 /* We can take certain shortcuts if we know this is a dict and
1980 not a dict subclass. */
1981 if (Py_EnterRecursiveCall(" while pickling an object") == 0) {
1982 res = batch_dict_exact(self, args);
1983 Py_LeaveRecursiveCall();
1985 } else {
1986 PyObject *iter = PyObject_CallMethod(args, "iteritems", "()");
1987 if (iter == NULL)
1988 goto finally;
1989 if (Py_EnterRecursiveCall(" while pickling an object") == 0) {
1990 res = batch_dict(self, iter);
1991 Py_LeaveRecursiveCall();
1993 Py_DECREF(iter);
1996 finally:
1997 if (self->fast && !fast_save_leave(self, args))
1998 res = -1;
2000 return res;
2004 static int
2005 save_inst(Picklerobject *self, PyObject *args)
2007 PyObject *class = 0, *module = 0, *name = 0, *state = 0,
2008 *getinitargs_func = 0, *getstate_func = 0, *class_args = 0;
2009 char *module_str, *name_str;
2010 int module_size, name_size, res = -1;
2012 static char inst = INST, obj = OBJ, build = BUILD;
2014 if (self->fast && !fast_save_enter(self, args))
2015 goto finally;
2017 if (self->write_func(self, &MARKv, 1) < 0)
2018 goto finally;
2020 if (!( class = PyObject_GetAttr(args, __class___str)))
2021 goto finally;
2023 if (self->bin) {
2024 if (save(self, class, 0) < 0)
2025 goto finally;
2028 if ((getinitargs_func = PyObject_GetAttr(args, __getinitargs___str))) {
2029 PyObject *element = 0;
2030 int i, len;
2032 if (!( class_args =
2033 PyObject_Call(getinitargs_func, empty_tuple, NULL)))
2034 goto finally;
2036 if ((len = PyObject_Size(class_args)) < 0)
2037 goto finally;
2039 for (i = 0; i < len; i++) {
2040 if (!( element = PySequence_GetItem(class_args, i)))
2041 goto finally;
2043 if (save(self, element, 0) < 0) {
2044 Py_DECREF(element);
2045 goto finally;
2048 Py_DECREF(element);
2051 else {
2052 if (PyErr_ExceptionMatches(PyExc_AttributeError))
2053 PyErr_Clear();
2054 else
2055 goto finally;
2058 if (!self->bin) {
2059 if (!( name = ((PyClassObject *)class)->cl_name )) {
2060 PyErr_SetString(PicklingError, "class has no name");
2061 goto finally;
2064 if (!( module = whichmodule(class, name)))
2065 goto finally;
2068 if ((module_size = PyString_Size(module)) < 0 ||
2069 (name_size = PyString_Size(name)) < 0)
2070 goto finally;
2072 module_str = PyString_AS_STRING((PyStringObject *)module);
2073 name_str = PyString_AS_STRING((PyStringObject *)name);
2075 if (self->write_func(self, &inst, 1) < 0)
2076 goto finally;
2078 if (self->write_func(self, module_str, module_size) < 0)
2079 goto finally;
2081 if (self->write_func(self, "\n", 1) < 0)
2082 goto finally;
2084 if (self->write_func(self, name_str, name_size) < 0)
2085 goto finally;
2087 if (self->write_func(self, "\n", 1) < 0)
2088 goto finally;
2090 else if (self->write_func(self, &obj, 1) < 0) {
2091 goto finally;
2094 if ((getstate_func = PyObject_GetAttr(args, __getstate___str))) {
2095 state = PyObject_Call(getstate_func, empty_tuple, NULL);
2096 if (!state)
2097 goto finally;
2099 else {
2100 if (PyErr_ExceptionMatches(PyExc_AttributeError))
2101 PyErr_Clear();
2102 else
2103 goto finally;
2105 if (!( state = PyObject_GetAttr(args, __dict___str))) {
2106 if (PyErr_ExceptionMatches(PyExc_AttributeError))
2107 PyErr_Clear();
2108 else
2109 goto finally;
2110 res = 0;
2111 goto finally;
2115 if (!PyDict_Check(state)) {
2116 if (put2(self, args) < 0)
2117 goto finally;
2119 else {
2120 if (put(self, args) < 0)
2121 goto finally;
2124 if (save(self, state, 0) < 0)
2125 goto finally;
2127 if (self->write_func(self, &build, 1) < 0)
2128 goto finally;
2130 res = 0;
2132 finally:
2133 if (self->fast && !fast_save_leave(self, args))
2134 res = -1;
2136 Py_XDECREF(module);
2137 Py_XDECREF(class);
2138 Py_XDECREF(state);
2139 Py_XDECREF(getinitargs_func);
2140 Py_XDECREF(getstate_func);
2141 Py_XDECREF(class_args);
2143 return res;
2147 static int
2148 save_global(Picklerobject *self, PyObject *args, PyObject *name)
2150 PyObject *global_name = 0, *module = 0, *mod = 0, *klass = 0;
2151 char *name_str, *module_str;
2152 int module_size, name_size, res = -1;
2154 static char global = GLOBAL;
2156 if (name) {
2157 global_name = name;
2158 Py_INCREF(global_name);
2160 else {
2161 if (!( global_name = PyObject_GetAttr(args, __name___str)))
2162 goto finally;
2165 if (!( module = whichmodule(args, global_name)))
2166 goto finally;
2168 if ((module_size = PyString_Size(module)) < 0 ||
2169 (name_size = PyString_Size(global_name)) < 0)
2170 goto finally;
2172 module_str = PyString_AS_STRING((PyStringObject *)module);
2173 name_str = PyString_AS_STRING((PyStringObject *)global_name);
2175 /* XXX This can be doing a relative import. Clearly it shouldn't,
2176 but I don't know how to stop it. :-( */
2177 mod = PyImport_ImportModule(module_str);
2178 if (mod == NULL) {
2179 cPickle_ErrFormat(PicklingError,
2180 "Can't pickle %s: import of module %s "
2181 "failed",
2182 "OS", args, module);
2183 goto finally;
2185 klass = PyObject_GetAttrString(mod, name_str);
2186 if (klass == NULL) {
2187 cPickle_ErrFormat(PicklingError,
2188 "Can't pickle %s: attribute lookup %s.%s "
2189 "failed",
2190 "OSS", args, module, global_name);
2191 goto finally;
2193 if (klass != args) {
2194 Py_DECREF(klass);
2195 cPickle_ErrFormat(PicklingError,
2196 "Can't pickle %s: it's not the same object "
2197 "as %s.%s",
2198 "OSS", args, module, global_name);
2199 goto finally;
2201 Py_DECREF(klass);
2203 if (self->proto >= 2) {
2204 /* See whether this is in the extension registry, and if
2205 * so generate an EXT opcode.
2207 PyObject *py_code; /* extension code as Python object */
2208 long code; /* extension code as C value */
2209 char c_str[5];
2210 int n;
2212 PyTuple_SET_ITEM(two_tuple, 0, module);
2213 PyTuple_SET_ITEM(two_tuple, 1, global_name);
2214 py_code = PyDict_GetItem(extension_registry, two_tuple);
2215 if (py_code == NULL)
2216 goto gen_global; /* not registered */
2218 /* Verify py_code has the right type and value. */
2219 if (!PyInt_Check(py_code)) {
2220 cPickle_ErrFormat(PicklingError, "Can't pickle %s: "
2221 "extension code %s isn't an integer",
2222 "OO", args, py_code);
2223 goto finally;
2225 code = PyInt_AS_LONG(py_code);
2226 if (code <= 0 || code > 0x7fffffffL) {
2227 cPickle_ErrFormat(PicklingError, "Can't pickle %s: "
2228 "extension code %ld is out of range",
2229 "Ol", args, code);
2230 goto finally;
2233 /* Generate an EXT opcode. */
2234 if (code <= 0xff) {
2235 c_str[0] = EXT1;
2236 c_str[1] = (char)code;
2237 n = 2;
2239 else if (code <= 0xffff) {
2240 c_str[0] = EXT2;
2241 c_str[1] = (char)(code & 0xff);
2242 c_str[2] = (char)((code >> 8) & 0xff);
2243 n = 3;
2245 else {
2246 c_str[0] = EXT4;
2247 c_str[1] = (char)(code & 0xff);
2248 c_str[2] = (char)((code >> 8) & 0xff);
2249 c_str[3] = (char)((code >> 16) & 0xff);
2250 c_str[4] = (char)((code >> 24) & 0xff);
2251 n = 5;
2254 if (self->write_func(self, c_str, n) >= 0)
2255 res = 0;
2256 goto finally; /* and don't memoize */
2259 gen_global:
2260 if (self->write_func(self, &global, 1) < 0)
2261 goto finally;
2263 if (self->write_func(self, module_str, module_size) < 0)
2264 goto finally;
2266 if (self->write_func(self, "\n", 1) < 0)
2267 goto finally;
2269 if (self->write_func(self, name_str, name_size) < 0)
2270 goto finally;
2272 if (self->write_func(self, "\n", 1) < 0)
2273 goto finally;
2275 if (put(self, args) < 0)
2276 goto finally;
2278 res = 0;
2280 finally:
2281 Py_XDECREF(module);
2282 Py_XDECREF(global_name);
2283 Py_XDECREF(mod);
2285 return res;
2288 static int
2289 save_pers(Picklerobject *self, PyObject *args, PyObject *f)
2291 PyObject *pid = 0;
2292 int size, res = -1;
2294 static char persid = PERSID, binpersid = BINPERSID;
2296 Py_INCREF(args);
2297 ARG_TUP(self, args);
2298 if (self->arg) {
2299 pid = PyObject_Call(f, self->arg, NULL);
2300 FREE_ARG_TUP(self);
2302 if (! pid) return -1;
2304 if (pid != Py_None) {
2305 if (!self->bin) {
2306 if (!PyString_Check(pid)) {
2307 PyErr_SetString(PicklingError,
2308 "persistent id must be string");
2309 goto finally;
2312 if (self->write_func(self, &persid, 1) < 0)
2313 goto finally;
2315 if ((size = PyString_Size(pid)) < 0)
2316 goto finally;
2318 if (self->write_func(self,
2319 PyString_AS_STRING(
2320 (PyStringObject *)pid),
2321 size) < 0)
2322 goto finally;
2324 if (self->write_func(self, "\n", 1) < 0)
2325 goto finally;
2327 res = 1;
2328 goto finally;
2330 else if (save(self, pid, 1) >= 0) {
2331 if (self->write_func(self, &binpersid, 1) < 0)
2332 res = -1;
2333 else
2334 res = 1;
2337 goto finally;
2340 res = 0;
2342 finally:
2343 Py_XDECREF(pid);
2345 return res;
2348 /* We're saving ob, and args is the 2-thru-5 tuple returned by the
2349 * appropriate __reduce__ method for ob.
2351 static int
2352 save_reduce(Picklerobject *self, PyObject *args, PyObject *fn, PyObject *ob)
2354 PyObject *callable;
2355 PyObject *argtup;
2356 PyObject *state = NULL;
2357 PyObject *listitems = Py_None;
2358 PyObject *dictitems = Py_None;
2359 Py_ssize_t size;
2361 int use_newobj = self->proto >= 2;
2363 static char reduce = REDUCE;
2364 static char build = BUILD;
2365 static char newobj = NEWOBJ;
2367 size = PyTuple_Size(args);
2368 if (size < 2 || size > 5) {
2369 cPickle_ErrFormat(PicklingError, "tuple returned by "
2370 "%s must contain 2 through 5 elements",
2371 "O", fn);
2372 return -1;
2375 if (! PyArg_UnpackTuple(args, "save_reduce", 2, 5,
2376 &callable,
2377 &argtup,
2378 &state,
2379 &listitems,
2380 &dictitems))
2381 return -1;
2383 if (!PyTuple_Check(argtup)) {
2384 cPickle_ErrFormat(PicklingError, "Second element of "
2385 "tuple returned by %s must be a tuple",
2386 "O", fn);
2387 return -1;
2390 if (state == Py_None)
2391 state = NULL;
2393 if (listitems == Py_None)
2394 listitems = NULL;
2395 else if (!PyIter_Check(listitems)) {
2396 cPickle_ErrFormat(PicklingError, "Fourth element of "
2397 "tuple returned by %s must be an iterator, not %s",
2398 "Os", fn, Py_TYPE(listitems)->tp_name);
2399 return -1;
2402 if (dictitems == Py_None)
2403 dictitems = NULL;
2404 else if (!PyIter_Check(dictitems)) {
2405 cPickle_ErrFormat(PicklingError, "Fifth element of "
2406 "tuple returned by %s must be an iterator, not %s",
2407 "Os", fn, Py_TYPE(dictitems)->tp_name);
2408 return -1;
2411 /* Protocol 2 special case: if callable's name is __newobj__, use
2412 * NEWOBJ. This consumes a lot of code.
2414 if (use_newobj) {
2415 PyObject *temp = PyObject_GetAttr(callable, __name___str);
2417 if (temp == NULL) {
2418 if (PyErr_ExceptionMatches(PyExc_AttributeError))
2419 PyErr_Clear();
2420 else
2421 return -1;
2422 use_newobj = 0;
2424 else {
2425 use_newobj = PyString_Check(temp) &&
2426 strcmp(PyString_AS_STRING(temp),
2427 "__newobj__") == 0;
2428 Py_DECREF(temp);
2431 if (use_newobj) {
2432 PyObject *cls;
2433 PyObject *newargtup;
2434 int n, i;
2436 /* Sanity checks. */
2437 n = PyTuple_Size(argtup);
2438 if (n < 1) {
2439 PyErr_SetString(PicklingError, "__newobj__ arglist "
2440 "is empty");
2441 return -1;
2444 cls = PyTuple_GET_ITEM(argtup, 0);
2445 if (! PyObject_HasAttrString(cls, "__new__")) {
2446 PyErr_SetString(PicklingError, "args[0] from "
2447 "__newobj__ args has no __new__");
2448 return -1;
2451 /* XXX How could ob be NULL? */
2452 if (ob != NULL) {
2453 PyObject *ob_dot_class;
2455 ob_dot_class = PyObject_GetAttr(ob, __class___str);
2456 if (ob_dot_class == NULL) {
2457 if (PyErr_ExceptionMatches(
2458 PyExc_AttributeError))
2459 PyErr_Clear();
2460 else
2461 return -1;
2463 i = ob_dot_class != cls; /* true iff a problem */
2464 Py_XDECREF(ob_dot_class);
2465 if (i) {
2466 PyErr_SetString(PicklingError, "args[0] from "
2467 "__newobj__ args has the wrong class");
2468 return -1;
2472 /* Save the class and its __new__ arguments. */
2473 if (save(self, cls, 0) < 0)
2474 return -1;
2476 newargtup = PyTuple_New(n-1); /* argtup[1:] */
2477 if (newargtup == NULL)
2478 return -1;
2479 for (i = 1; i < n; ++i) {
2480 PyObject *temp = PyTuple_GET_ITEM(argtup, i);
2481 Py_INCREF(temp);
2482 PyTuple_SET_ITEM(newargtup, i-1, temp);
2484 i = save(self, newargtup, 0);
2485 Py_DECREF(newargtup);
2486 if (i < 0)
2487 return -1;
2489 /* Add NEWOBJ opcode. */
2490 if (self->write_func(self, &newobj, 1) < 0)
2491 return -1;
2493 else {
2494 /* Not using NEWOBJ. */
2495 if (save(self, callable, 0) < 0 ||
2496 save(self, argtup, 0) < 0 ||
2497 self->write_func(self, &reduce, 1) < 0)
2498 return -1;
2501 /* Memoize. */
2502 /* XXX How can ob be NULL? */
2503 if (ob != NULL) {
2504 if (state && !PyDict_Check(state)) {
2505 if (put2(self, ob) < 0)
2506 return -1;
2508 else if (put(self, ob) < 0)
2509 return -1;
2513 if (listitems && batch_list(self, listitems) < 0)
2514 return -1;
2516 if (dictitems && batch_dict(self, dictitems) < 0)
2517 return -1;
2519 if (state) {
2520 if (save(self, state, 0) < 0 ||
2521 self->write_func(self, &build, 1) < 0)
2522 return -1;
2525 return 0;
2528 static int
2529 save(Picklerobject *self, PyObject *args, int pers_save)
2531 PyTypeObject *type;
2532 PyObject *py_ob_id = 0, *__reduce__ = 0, *t = 0;
2533 int res = -1;
2534 int tmp;
2536 if (Py_EnterRecursiveCall(" while pickling an object"))
2537 return -1;
2539 if (!pers_save && self->pers_func) {
2540 if ((tmp = save_pers(self, args, self->pers_func)) != 0) {
2541 res = tmp;
2542 goto finally;
2546 if (args == Py_None) {
2547 res = save_none(self, args);
2548 goto finally;
2551 type = Py_TYPE(args);
2553 switch (type->tp_name[0]) {
2554 case 'b':
2555 if (args == Py_False || args == Py_True) {
2556 res = save_bool(self, args);
2557 goto finally;
2559 break;
2560 case 'i':
2561 if (type == &PyInt_Type) {
2562 res = save_int(self, args);
2563 goto finally;
2565 break;
2567 case 'l':
2568 if (type == &PyLong_Type) {
2569 res = save_long(self, args);
2570 goto finally;
2572 break;
2574 case 'f':
2575 if (type == &PyFloat_Type) {
2576 res = save_float(self, args);
2577 goto finally;
2579 break;
2581 case 't':
2582 if (type == &PyTuple_Type && PyTuple_Size(args) == 0) {
2583 res = save_tuple(self, args);
2584 goto finally;
2586 break;
2588 case 's':
2589 if ((type == &PyString_Type) && (PyString_GET_SIZE(args) < 2)) {
2590 res = save_string(self, args, 0);
2591 goto finally;
2593 break;
2595 #ifdef Py_USING_UNICODE
2596 case 'u':
2597 if ((type == &PyUnicode_Type) && (PyString_GET_SIZE(args) < 2)) {
2598 res = save_unicode(self, args, 0);
2599 goto finally;
2601 break;
2602 #endif
2605 if (Py_REFCNT(args) > 1) {
2606 if (!( py_ob_id = PyLong_FromVoidPtr(args)))
2607 goto finally;
2609 if (PyDict_GetItem(self->memo, py_ob_id)) {
2610 if (get(self, py_ob_id) < 0)
2611 goto finally;
2613 res = 0;
2614 goto finally;
2618 switch (type->tp_name[0]) {
2619 case 's':
2620 if (type == &PyString_Type) {
2621 res = save_string(self, args, 1);
2622 goto finally;
2624 break;
2626 #ifdef Py_USING_UNICODE
2627 case 'u':
2628 if (type == &PyUnicode_Type) {
2629 res = save_unicode(self, args, 1);
2630 goto finally;
2632 break;
2633 #endif
2635 case 't':
2636 if (type == &PyTuple_Type) {
2637 res = save_tuple(self, args);
2638 goto finally;
2640 if (type == &PyType_Type) {
2641 res = save_global(self, args, NULL);
2642 goto finally;
2644 break;
2646 case 'l':
2647 if (type == &PyList_Type) {
2648 res = save_list(self, args);
2649 goto finally;
2651 break;
2653 case 'd':
2654 if (type == &PyDict_Type) {
2655 res = save_dict(self, args);
2656 goto finally;
2658 break;
2660 case 'i':
2661 if (type == &PyInstance_Type) {
2662 res = save_inst(self, args);
2663 goto finally;
2665 break;
2667 case 'c':
2668 if (type == &PyClass_Type) {
2669 res = save_global(self, args, NULL);
2670 goto finally;
2672 break;
2674 case 'f':
2675 if (type == &PyFunction_Type) {
2676 res = save_global(self, args, NULL);
2677 if (res && PyErr_ExceptionMatches(PickleError)) {
2678 /* fall back to reduce */
2679 PyErr_Clear();
2680 break;
2682 goto finally;
2684 break;
2686 case 'b':
2687 if (type == &PyCFunction_Type) {
2688 res = save_global(self, args, NULL);
2689 goto finally;
2693 if (!pers_save && self->inst_pers_func) {
2694 if ((tmp = save_pers(self, args, self->inst_pers_func)) != 0) {
2695 res = tmp;
2696 goto finally;
2700 if (PyType_IsSubtype(type, &PyType_Type)) {
2701 res = save_global(self, args, NULL);
2702 goto finally;
2705 /* Get a reduction callable, and call it. This may come from
2706 * copy_reg.dispatch_table, the object's __reduce_ex__ method,
2707 * or the object's __reduce__ method.
2709 __reduce__ = PyDict_GetItem(dispatch_table, (PyObject *)type);
2710 if (__reduce__ != NULL) {
2711 Py_INCREF(__reduce__);
2712 Py_INCREF(args);
2713 ARG_TUP(self, args);
2714 if (self->arg) {
2715 t = PyObject_Call(__reduce__, self->arg, NULL);
2716 FREE_ARG_TUP(self);
2719 else {
2720 /* Check for a __reduce_ex__ method. */
2721 __reduce__ = PyObject_GetAttr(args, __reduce_ex___str);
2722 if (__reduce__ != NULL) {
2723 t = PyInt_FromLong(self->proto);
2724 if (t != NULL) {
2725 ARG_TUP(self, t);
2726 t = NULL;
2727 if (self->arg) {
2728 t = PyObject_Call(__reduce__,
2729 self->arg, NULL);
2730 FREE_ARG_TUP(self);
2734 else {
2735 if (PyErr_ExceptionMatches(PyExc_AttributeError))
2736 PyErr_Clear();
2737 else
2738 goto finally;
2739 /* Check for a __reduce__ method. */
2740 __reduce__ = PyObject_GetAttr(args, __reduce___str);
2741 if (__reduce__ != NULL) {
2742 t = PyObject_Call(__reduce__,
2743 empty_tuple, NULL);
2745 else {
2746 PyErr_SetObject(UnpickleableError, args);
2747 goto finally;
2752 if (t == NULL)
2753 goto finally;
2755 if (PyString_Check(t)) {
2756 res = save_global(self, args, t);
2757 goto finally;
2760 if (!PyTuple_Check(t)) {
2761 cPickle_ErrFormat(PicklingError, "Value returned by "
2762 "%s must be string or tuple",
2763 "O", __reduce__);
2764 goto finally;
2767 res = save_reduce(self, t, __reduce__, args);
2769 finally:
2770 Py_LeaveRecursiveCall();
2771 Py_XDECREF(py_ob_id);
2772 Py_XDECREF(__reduce__);
2773 Py_XDECREF(t);
2775 return res;
2779 static int
2780 dump(Picklerobject *self, PyObject *args)
2782 static char stop = STOP;
2784 if (self->proto >= 2) {
2785 char bytes[2];
2787 bytes[0] = PROTO;
2788 assert(self->proto >= 0 && self->proto < 256);
2789 bytes[1] = (char)self->proto;
2790 if (self->write_func(self, bytes, 2) < 0)
2791 return -1;
2794 if (save(self, args, 0) < 0)
2795 return -1;
2797 if (self->write_func(self, &stop, 1) < 0)
2798 return -1;
2800 if (self->write_func(self, NULL, 0) < 0)
2801 return -1;
2803 return 0;
2806 static PyObject *
2807 Pickle_clear_memo(Picklerobject *self, PyObject *args)
2809 if (self->memo)
2810 PyDict_Clear(self->memo);
2811 Py_INCREF(Py_None);
2812 return Py_None;
2815 static PyObject *
2816 Pickle_getvalue(Picklerobject *self, PyObject *args)
2818 int l, i, rsize, ssize, clear=1, lm;
2819 long ik;
2820 PyObject *k, *r;
2821 char *s, *p, *have_get;
2822 Pdata *data;
2824 /* Can be called by Python code or C code */
2825 if (args && !PyArg_ParseTuple(args, "|i:getvalue", &clear))
2826 return NULL;
2828 /* Check to make sure we are based on a list */
2829 if (! Pdata_Check(self->file)) {
2830 PyErr_SetString(PicklingError,
2831 "Attempt to getvalue() a non-list-based pickler");
2832 return NULL;
2835 /* flush write buffer */
2836 if (write_other(self, NULL, 0) < 0) return NULL;
2838 data=(Pdata*)self->file;
2839 l=data->length;
2841 /* set up an array to hold get/put status */
2842 lm = PyDict_Size(self->memo);
2843 if (lm < 0) return NULL;
2844 lm++;
2845 have_get = malloc(lm);
2846 if (have_get == NULL) return PyErr_NoMemory();
2847 memset(have_get, 0, lm);
2849 /* Scan for gets. */
2850 for (rsize = 0, i = l; --i >= 0; ) {
2851 k = data->data[i];
2853 if (PyString_Check(k))
2854 rsize += PyString_GET_SIZE(k);
2856 else if (PyInt_Check(k)) { /* put */
2857 ik = PyInt_AS_LONG((PyIntObject*)k);
2858 if (ik >= lm || ik == 0) {
2859 PyErr_SetString(PicklingError,
2860 "Invalid get data");
2861 goto err;
2863 if (have_get[ik]) /* with matching get */
2864 rsize += ik < 256 ? 2 : 5;
2867 else if (! (PyTuple_Check(k) &&
2868 PyTuple_GET_SIZE(k) == 2 &&
2869 PyInt_Check((k = PyTuple_GET_ITEM(k, 0))))
2871 PyErr_SetString(PicklingError,
2872 "Unexpected data in internal list");
2873 goto err;
2876 else { /* put */
2877 ik = PyInt_AS_LONG((PyIntObject *)k);
2878 if (ik >= lm || ik == 0) {
2879 PyErr_SetString(PicklingError,
2880 "Invalid get data");
2881 return NULL;
2883 have_get[ik] = 1;
2884 rsize += ik < 256 ? 2 : 5;
2888 /* Now generate the result */
2889 r = PyString_FromStringAndSize(NULL, rsize);
2890 if (r == NULL) goto err;
2891 s = PyString_AS_STRING((PyStringObject *)r);
2893 for (i = 0; i < l; i++) {
2894 k = data->data[i];
2896 if (PyString_Check(k)) {
2897 ssize = PyString_GET_SIZE(k);
2898 if (ssize) {
2899 p=PyString_AS_STRING((PyStringObject *)k);
2900 while (--ssize >= 0)
2901 *s++ = *p++;
2905 else if (PyTuple_Check(k)) { /* get */
2906 ik = PyInt_AS_LONG((PyIntObject *)
2907 PyTuple_GET_ITEM(k, 0));
2908 if (ik < 256) {
2909 *s++ = BINGET;
2910 *s++ = (int)(ik & 0xff);
2912 else {
2913 *s++ = LONG_BINGET;
2914 *s++ = (int)(ik & 0xff);
2915 *s++ = (int)((ik >> 8) & 0xff);
2916 *s++ = (int)((ik >> 16) & 0xff);
2917 *s++ = (int)((ik >> 24) & 0xff);
2921 else { /* put */
2922 ik = PyInt_AS_LONG((PyIntObject*)k);
2924 if (have_get[ik]) { /* with matching get */
2925 if (ik < 256) {
2926 *s++ = BINPUT;
2927 *s++ = (int)(ik & 0xff);
2929 else {
2930 *s++ = LONG_BINPUT;
2931 *s++ = (int)(ik & 0xff);
2932 *s++ = (int)((ik >> 8) & 0xff);
2933 *s++ = (int)((ik >> 16) & 0xff);
2934 *s++ = (int)((ik >> 24) & 0xff);
2940 if (clear) {
2941 PyDict_Clear(self->memo);
2942 Pdata_clear(data, 0);
2945 free(have_get);
2946 return r;
2947 err:
2948 free(have_get);
2949 return NULL;
2952 static PyObject *
2953 Pickler_dump(Picklerobject *self, PyObject *args)
2955 PyObject *ob;
2956 int get=0;
2958 if (!( PyArg_ParseTuple(args, "O|i:dump", &ob, &get)))
2959 return NULL;
2961 if (dump(self, ob) < 0)
2962 return NULL;
2964 if (get) return Pickle_getvalue(self, NULL);
2966 /* XXX Why does dump() return self? */
2967 Py_INCREF(self);
2968 return (PyObject*)self;
2972 static struct PyMethodDef Pickler_methods[] =
2974 {"dump", (PyCFunction)Pickler_dump, METH_VARARGS,
2975 PyDoc_STR("dump(object) -- "
2976 "Write an object in pickle format to the object's pickle stream")},
2977 {"clear_memo", (PyCFunction)Pickle_clear_memo, METH_NOARGS,
2978 PyDoc_STR("clear_memo() -- Clear the picklers memo")},
2979 {"getvalue", (PyCFunction)Pickle_getvalue, METH_VARARGS,
2980 PyDoc_STR("getvalue() -- Finish picking a list-based pickle")},
2981 {NULL, NULL} /* sentinel */
2985 static Picklerobject *
2986 newPicklerobject(PyObject *file, int proto)
2988 Picklerobject *self;
2990 if (proto < 0)
2991 proto = HIGHEST_PROTOCOL;
2992 if (proto > HIGHEST_PROTOCOL) {
2993 PyErr_Format(PyExc_ValueError, "pickle protocol %d asked for; "
2994 "the highest available protocol is %d",
2995 proto, HIGHEST_PROTOCOL);
2996 return NULL;
2999 self = PyObject_GC_New(Picklerobject, &Picklertype);
3000 if (self == NULL)
3001 return NULL;
3002 self->proto = proto;
3003 self->bin = proto > 0;
3004 self->fp = NULL;
3005 self->write = NULL;
3006 self->memo = NULL;
3007 self->arg = NULL;
3008 self->pers_func = NULL;
3009 self->inst_pers_func = NULL;
3010 self->write_buf = NULL;
3011 self->fast = 0;
3012 self->fast_container = 0;
3013 self->fast_memo = NULL;
3014 self->buf_size = 0;
3015 self->dispatch_table = NULL;
3017 self->file = NULL;
3018 if (file)
3019 Py_INCREF(file);
3020 else {
3021 file = Pdata_New();
3022 if (file == NULL)
3023 goto err;
3025 self->file = file;
3027 if (!( self->memo = PyDict_New()))
3028 goto err;
3030 if (PyFile_Check(file)) {
3031 self->fp = PyFile_AsFile(file);
3032 if (self->fp == NULL) {
3033 PyErr_SetString(PyExc_ValueError,
3034 "I/O operation on closed file");
3035 goto err;
3037 self->write_func = write_file;
3039 else if (PycStringIO_OutputCheck(file)) {
3040 self->write_func = write_cStringIO;
3042 else if (file == Py_None) {
3043 self->write_func = write_none;
3045 else {
3046 self->write_func = write_other;
3048 if (! Pdata_Check(file)) {
3049 self->write = PyObject_GetAttr(file, write_str);
3050 if (!self->write) {
3051 PyErr_Clear();
3052 PyErr_SetString(PyExc_TypeError,
3053 "argument must have 'write' "
3054 "attribute");
3055 goto err;
3059 self->write_buf = (char *)PyMem_Malloc(WRITE_BUF_SIZE);
3060 if (self->write_buf == NULL) {
3061 PyErr_NoMemory();
3062 goto err;
3066 if (PyEval_GetRestricted()) {
3067 /* Restricted execution, get private tables */
3068 PyObject *m = PyImport_ImportModule("copy_reg");
3070 if (m == NULL)
3071 goto err;
3072 self->dispatch_table = PyObject_GetAttr(m, dispatch_table_str);
3073 Py_DECREF(m);
3074 if (self->dispatch_table == NULL)
3075 goto err;
3077 else {
3078 self->dispatch_table = dispatch_table;
3079 Py_INCREF(dispatch_table);
3081 PyObject_GC_Track(self);
3083 return self;
3085 err:
3086 Py_DECREF(self);
3087 return NULL;
3091 static PyObject *
3092 get_Pickler(PyObject *self, PyObject *args, PyObject *kwds)
3094 static char *kwlist[] = {"file", "protocol", NULL};
3095 PyObject *file = NULL;
3096 int proto = 0;
3098 /* XXX
3099 * The documented signature is Pickler(file, protocol=0), but this
3100 * accepts Pickler() and Pickler(integer) too. The meaning then
3101 * is clear as mud, undocumented, and not supported by pickle.py.
3102 * I'm told Zope uses this, but I haven't traced into this code
3103 * far enough to figure out what it means.
3105 if (!PyArg_ParseTuple(args, "|i:Pickler", &proto)) {
3106 PyErr_Clear();
3107 proto = 0;
3108 if (!PyArg_ParseTupleAndKeywords(args, kwds, "O|i:Pickler",
3109 kwlist, &file, &proto))
3110 return NULL;
3112 return (PyObject *)newPicklerobject(file, proto);
3116 static void
3117 Pickler_dealloc(Picklerobject *self)
3119 PyObject_GC_UnTrack(self);
3120 Py_XDECREF(self->write);
3121 Py_XDECREF(self->memo);
3122 Py_XDECREF(self->fast_memo);
3123 Py_XDECREF(self->arg);
3124 Py_XDECREF(self->file);
3125 Py_XDECREF(self->pers_func);
3126 Py_XDECREF(self->inst_pers_func);
3127 Py_XDECREF(self->dispatch_table);
3128 PyMem_Free(self->write_buf);
3129 Py_TYPE(self)->tp_free((PyObject *)self);
3132 static int
3133 Pickler_traverse(Picklerobject *self, visitproc visit, void *arg)
3135 Py_VISIT(self->write);
3136 Py_VISIT(self->memo);
3137 Py_VISIT(self->fast_memo);
3138 Py_VISIT(self->arg);
3139 Py_VISIT(self->file);
3140 Py_VISIT(self->pers_func);
3141 Py_VISIT(self->inst_pers_func);
3142 Py_VISIT(self->dispatch_table);
3143 return 0;
3146 static int
3147 Pickler_clear(Picklerobject *self)
3149 Py_CLEAR(self->write);
3150 Py_CLEAR(self->memo);
3151 Py_CLEAR(self->fast_memo);
3152 Py_CLEAR(self->arg);
3153 Py_CLEAR(self->file);
3154 Py_CLEAR(self->pers_func);
3155 Py_CLEAR(self->inst_pers_func);
3156 Py_CLEAR(self->dispatch_table);
3157 return 0;
3160 static PyObject *
3161 Pickler_get_pers_func(Picklerobject *p)
3163 if (p->pers_func == NULL)
3164 PyErr_SetString(PyExc_AttributeError, "persistent_id");
3165 else
3166 Py_INCREF(p->pers_func);
3167 return p->pers_func;
3170 static int
3171 Pickler_set_pers_func(Picklerobject *p, PyObject *v)
3173 if (v == NULL) {
3174 PyErr_SetString(PyExc_TypeError,
3175 "attribute deletion is not supported");
3176 return -1;
3178 Py_XDECREF(p->pers_func);
3179 Py_INCREF(v);
3180 p->pers_func = v;
3181 return 0;
3184 static int
3185 Pickler_set_inst_pers_func(Picklerobject *p, PyObject *v)
3187 if (v == NULL) {
3188 PyErr_SetString(PyExc_TypeError,
3189 "attribute deletion is not supported");
3190 return -1;
3192 Py_XDECREF(p->inst_pers_func);
3193 Py_INCREF(v);
3194 p->inst_pers_func = v;
3195 return 0;
3198 static PyObject *
3199 Pickler_get_memo(Picklerobject *p)
3201 if (p->memo == NULL)
3202 PyErr_SetString(PyExc_AttributeError, "memo");
3203 else
3204 Py_INCREF(p->memo);
3205 return p->memo;
3208 static int
3209 Pickler_set_memo(Picklerobject *p, PyObject *v)
3211 if (v == NULL) {
3212 PyErr_SetString(PyExc_TypeError,
3213 "attribute deletion is not supported");
3214 return -1;
3216 if (!PyDict_Check(v)) {
3217 PyErr_SetString(PyExc_TypeError, "memo must be a dictionary");
3218 return -1;
3220 Py_XDECREF(p->memo);
3221 Py_INCREF(v);
3222 p->memo = v;
3223 return 0;
3226 static PyObject *
3227 Pickler_get_error(Picklerobject *p)
3229 /* why is this an attribute on the Pickler? */
3230 Py_INCREF(PicklingError);
3231 return PicklingError;
3234 static PyMemberDef Pickler_members[] = {
3235 {"binary", T_INT, offsetof(Picklerobject, bin)},
3236 {"fast", T_INT, offsetof(Picklerobject, fast)},
3237 {NULL}
3240 static PyGetSetDef Pickler_getsets[] = {
3241 {"persistent_id", (getter)Pickler_get_pers_func,
3242 (setter)Pickler_set_pers_func},
3243 {"inst_persistent_id", NULL, (setter)Pickler_set_inst_pers_func},
3244 {"memo", (getter)Pickler_get_memo, (setter)Pickler_set_memo},
3245 {"PicklingError", (getter)Pickler_get_error, NULL},
3246 {NULL}
3249 PyDoc_STRVAR(Picklertype__doc__,
3250 "Objects that know how to pickle objects\n");
3252 static PyTypeObject Picklertype = {
3253 PyVarObject_HEAD_INIT(NULL, 0)
3254 "cPickle.Pickler", /*tp_name*/
3255 sizeof(Picklerobject), /*tp_basicsize*/
3257 (destructor)Pickler_dealloc, /* tp_dealloc */
3258 0, /* tp_print */
3259 0, /* tp_getattr */
3260 0, /* tp_setattr */
3261 0, /* tp_compare */
3262 0, /* tp_repr */
3263 0, /* tp_as_number */
3264 0, /* tp_as_sequence */
3265 0, /* tp_as_mapping */
3266 0, /* tp_hash */
3267 0, /* tp_call */
3268 0, /* tp_str */
3269 PyObject_GenericGetAttr, /* tp_getattro */
3270 PyObject_GenericSetAttr, /* tp_setattro */
3271 0, /* tp_as_buffer */
3272 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE | Py_TPFLAGS_HAVE_GC,
3273 Picklertype__doc__, /* tp_doc */
3274 (traverseproc)Pickler_traverse, /* tp_traverse */
3275 (inquiry)Pickler_clear, /* tp_clear */
3276 0, /* tp_richcompare */
3277 0, /* tp_weaklistoffset */
3278 0, /* tp_iter */
3279 0, /* tp_iternext */
3280 Pickler_methods, /* tp_methods */
3281 Pickler_members, /* tp_members */
3282 Pickler_getsets, /* tp_getset */
3285 static PyObject *
3286 find_class(PyObject *py_module_name, PyObject *py_global_name, PyObject *fc)
3288 PyObject *global = 0, *module;
3290 if (fc) {
3291 if (fc==Py_None) {
3292 PyErr_SetString(UnpicklingError, "Global and instance "
3293 "pickles are not supported.");
3294 return NULL;
3296 return PyObject_CallFunctionObjArgs(fc, py_module_name,
3297 py_global_name, NULL);
3300 module = PySys_GetObject("modules");
3301 if (module == NULL)
3302 return NULL;
3304 module = PyDict_GetItem(module, py_module_name);
3305 if (module == NULL) {
3306 module = PyImport_Import(py_module_name);
3307 if (!module)
3308 return NULL;
3309 global = PyObject_GetAttr(module, py_global_name);
3310 Py_DECREF(module);
3312 else
3313 global = PyObject_GetAttr(module, py_global_name);
3314 return global;
3317 static int
3318 marker(Unpicklerobject *self)
3320 if (self->num_marks < 1) {
3321 PyErr_SetString(UnpicklingError, "could not find MARK");
3322 return -1;
3325 return self->marks[--self->num_marks];
3329 static int
3330 load_none(Unpicklerobject *self)
3332 PDATA_APPEND(self->stack, Py_None, -1);
3333 return 0;
3336 static int
3337 bad_readline(void)
3339 PyErr_SetString(UnpicklingError, "pickle data was truncated");
3340 return -1;
3343 static int
3344 load_int(Unpicklerobject *self)
3346 PyObject *py_int = 0;
3347 char *endptr, *s;
3348 int len, res = -1;
3349 long l;
3351 if ((len = self->readline_func(self, &s)) < 0) return -1;
3352 if (len < 2) return bad_readline();
3353 if (!( s=pystrndup(s,len))) return -1;
3355 errno = 0;
3356 l = strtol(s, &endptr, 0);
3358 if (errno || (*endptr != '\n') || (endptr[1] != '\0')) {
3359 /* Hm, maybe we've got something long. Let's try reading
3360 it as a Python long object. */
3361 errno = 0;
3362 py_int = PyLong_FromString(s, NULL, 0);
3363 if (py_int == NULL) {
3364 PyErr_SetString(PyExc_ValueError,
3365 "could not convert string to int");
3366 goto finally;
3369 else {
3370 if (len == 3 && (l == 0 || l == 1)) {
3371 if (!( py_int = PyBool_FromLong(l))) goto finally;
3373 else {
3374 if (!( py_int = PyInt_FromLong(l))) goto finally;
3378 free(s);
3379 PDATA_PUSH(self->stack, py_int, -1);
3380 return 0;
3382 finally:
3383 free(s);
3385 return res;
3388 static int
3389 load_bool(Unpicklerobject *self, PyObject *boolean)
3391 assert(boolean == Py_True || boolean == Py_False);
3392 PDATA_APPEND(self->stack, boolean, -1);
3393 return 0;
3396 /* s contains x bytes of a little-endian integer. Return its value as a
3397 * C int. Obscure: when x is 1 or 2, this is an unsigned little-endian
3398 * int, but when x is 4 it's a signed one. This is an historical source
3399 * of x-platform bugs.
3401 static long
3402 calc_binint(char *s, int x)
3404 unsigned char c;
3405 int i;
3406 long l;
3408 for (i = 0, l = 0L; i < x; i++) {
3409 c = (unsigned char)s[i];
3410 l |= (long)c << (i * 8);
3412 #if SIZEOF_LONG > 4
3413 /* Unlike BININT1 and BININT2, BININT (more accurately BININT4)
3414 * is signed, so on a box with longs bigger than 4 bytes we need
3415 * to extend a BININT's sign bit to the full width.
3417 if (x == 4 && l & (1L << 31))
3418 l |= (~0L) << 32;
3419 #endif
3420 return l;
3424 static int
3425 load_binintx(Unpicklerobject *self, char *s, int x)
3427 PyObject *py_int = 0;
3428 long l;
3430 l = calc_binint(s, x);
3432 if (!( py_int = PyInt_FromLong(l)))
3433 return -1;
3435 PDATA_PUSH(self->stack, py_int, -1);
3436 return 0;
3440 static int
3441 load_binint(Unpicklerobject *self)
3443 char *s;
3445 if (self->read_func(self, &s, 4) < 0)
3446 return -1;
3448 return load_binintx(self, s, 4);
3452 static int
3453 load_binint1(Unpicklerobject *self)
3455 char *s;
3457 if (self->read_func(self, &s, 1) < 0)
3458 return -1;
3460 return load_binintx(self, s, 1);
3464 static int
3465 load_binint2(Unpicklerobject *self)
3467 char *s;
3469 if (self->read_func(self, &s, 2) < 0)
3470 return -1;
3472 return load_binintx(self, s, 2);
3475 static int
3476 load_long(Unpicklerobject *self)
3478 PyObject *l = 0;
3479 char *end, *s;
3480 int len, res = -1;
3482 if ((len = self->readline_func(self, &s)) < 0) return -1;
3483 if (len < 2) return bad_readline();
3484 if (!( s=pystrndup(s,len))) return -1;
3486 if (!( l = PyLong_FromString(s, &end, 0)))
3487 goto finally;
3489 free(s);
3490 PDATA_PUSH(self->stack, l, -1);
3491 return 0;
3493 finally:
3494 free(s);
3496 return res;
3499 /* 'size' bytes contain the # of bytes of little-endian 256's-complement
3500 * data following.
3502 static int
3503 load_counted_long(Unpicklerobject *self, int size)
3505 Py_ssize_t i;
3506 char *nbytes;
3507 unsigned char *pdata;
3508 PyObject *along;
3510 assert(size == 1 || size == 4);
3511 i = self->read_func(self, &nbytes, size);
3512 if (i < 0) return -1;
3514 size = calc_binint(nbytes, size);
3515 if (size < 0) {
3516 /* Corrupt or hostile pickle -- we never write one like
3517 * this.
3519 PyErr_SetString(UnpicklingError, "LONG pickle has negative "
3520 "byte count");
3521 return -1;
3524 if (size == 0)
3525 along = PyLong_FromLong(0L);
3526 else {
3527 /* Read the raw little-endian bytes & convert. */
3528 i = self->read_func(self, (char **)&pdata, size);
3529 if (i < 0) return -1;
3530 along = _PyLong_FromByteArray(pdata, (size_t)size,
3531 1 /* little endian */, 1 /* signed */);
3533 if (along == NULL)
3534 return -1;
3535 PDATA_PUSH(self->stack, along, -1);
3536 return 0;
3539 static int
3540 load_float(Unpicklerobject *self)
3542 PyObject *py_float = 0;
3543 char *endptr, *s;
3544 int len, res = -1;
3545 double d;
3547 if ((len = self->readline_func(self, &s)) < 0) return -1;
3548 if (len < 2) return bad_readline();
3549 if (!( s=pystrndup(s,len))) return -1;
3551 d = PyOS_string_to_double(s, &endptr, PyExc_OverflowError);
3553 if (d == -1.0 && PyErr_Occurred()) {
3554 goto finally;
3555 } else if ((endptr[0] != '\n') || (endptr[1] != '\0')) {
3556 PyErr_SetString(PyExc_ValueError,
3557 "could not convert string to float");
3558 goto finally;
3561 if (!( py_float = PyFloat_FromDouble(d)))
3562 goto finally;
3564 free(s);
3565 PDATA_PUSH(self->stack, py_float, -1);
3566 return 0;
3568 finally:
3569 free(s);
3571 return res;
3574 static int
3575 load_binfloat(Unpicklerobject *self)
3577 PyObject *py_float;
3578 double x;
3579 char *p;
3581 if (self->read_func(self, &p, 8) < 0)
3582 return -1;
3584 x = _PyFloat_Unpack8((unsigned char *)p, 0);
3585 if (x == -1.0 && PyErr_Occurred())
3586 return -1;
3588 py_float = PyFloat_FromDouble(x);
3589 if (py_float == NULL)
3590 return -1;
3592 PDATA_PUSH(self->stack, py_float, -1);
3593 return 0;
3596 static int
3597 load_string(Unpicklerobject *self)
3599 PyObject *str = 0;
3600 int len, res = -1;
3601 char *s, *p;
3603 if ((len = self->readline_func(self, &s)) < 0) return -1;
3604 if (len < 2) return bad_readline();
3605 if (!( s=pystrndup(s,len))) return -1;
3608 /* Strip outermost quotes */
3609 while (s[len-1] <= ' ')
3610 len--;
3611 if(s[0]=='"' && s[len-1]=='"'){
3612 s[len-1] = '\0';
3613 p = s + 1 ;
3614 len -= 2;
3615 } else if(s[0]=='\'' && s[len-1]=='\''){
3616 s[len-1] = '\0';
3617 p = s + 1 ;
3618 len -= 2;
3619 } else
3620 goto insecure;
3621 /********************************************/
3623 str = PyString_DecodeEscape(p, len, NULL, 0, NULL);
3624 free(s);
3625 if (str) {
3626 PDATA_PUSH(self->stack, str, -1);
3627 res = 0;
3629 return res;
3631 insecure:
3632 free(s);
3633 PyErr_SetString(PyExc_ValueError,"insecure string pickle");
3634 return -1;
3638 static int
3639 load_binstring(Unpicklerobject *self)
3641 PyObject *py_string = 0;
3642 long l;
3643 char *s;
3645 if (self->read_func(self, &s, 4) < 0) return -1;
3647 l = calc_binint(s, 4);
3648 if (l < 0) {
3649 /* Corrupt or hostile pickle -- we never write one like
3650 * this.
3652 PyErr_SetString(UnpicklingError,
3653 "BINSTRING pickle has negative byte count");
3654 return -1;
3657 if (self->read_func(self, &s, l) < 0)
3658 return -1;
3660 if (!( py_string = PyString_FromStringAndSize(s, l)))
3661 return -1;
3663 PDATA_PUSH(self->stack, py_string, -1);
3664 return 0;
3668 static int
3669 load_short_binstring(Unpicklerobject *self)
3671 PyObject *py_string = 0;
3672 unsigned char l;
3673 char *s;
3675 if (self->read_func(self, &s, 1) < 0)
3676 return -1;
3678 l = (unsigned char)s[0];
3680 if (self->read_func(self, &s, l) < 0) return -1;
3682 if (!( py_string = PyString_FromStringAndSize(s, l))) return -1;
3684 PDATA_PUSH(self->stack, py_string, -1);
3685 return 0;
3689 #ifdef Py_USING_UNICODE
3690 static int
3691 load_unicode(Unpicklerobject *self)
3693 PyObject *str = 0;
3694 int len, res = -1;
3695 char *s;
3697 if ((len = self->readline_func(self, &s)) < 0) return -1;
3698 if (len < 1) return bad_readline();
3700 if (!( str = PyUnicode_DecodeRawUnicodeEscape(s, len - 1, NULL)))
3701 goto finally;
3703 PDATA_PUSH(self->stack, str, -1);
3704 return 0;
3706 finally:
3707 return res;
3709 #endif
3712 #ifdef Py_USING_UNICODE
3713 static int
3714 load_binunicode(Unpicklerobject *self)
3716 PyObject *unicode;
3717 long l;
3718 char *s;
3720 if (self->read_func(self, &s, 4) < 0) return -1;
3722 l = calc_binint(s, 4);
3723 if (l < 0) {
3724 /* Corrupt or hostile pickle -- we never write one like
3725 * this.
3727 PyErr_SetString(UnpicklingError,
3728 "BINUNICODE pickle has negative byte count");
3729 return -1;
3732 if (self->read_func(self, &s, l) < 0)
3733 return -1;
3735 if (!( unicode = PyUnicode_DecodeUTF8(s, l, NULL)))
3736 return -1;
3738 PDATA_PUSH(self->stack, unicode, -1);
3739 return 0;
3741 #endif
3744 static int
3745 load_tuple(Unpicklerobject *self)
3747 PyObject *tup;
3748 int i;
3750 if ((i = marker(self)) < 0) return -1;
3751 if (!( tup=Pdata_popTuple(self->stack, i))) return -1;
3752 PDATA_PUSH(self->stack, tup, -1);
3753 return 0;
3756 static int
3757 load_counted_tuple(Unpicklerobject *self, int len)
3759 PyObject *tup = PyTuple_New(len);
3761 if (tup == NULL)
3762 return -1;
3764 while (--len >= 0) {
3765 PyObject *element;
3767 PDATA_POP(self->stack, element);
3768 if (element == NULL)
3769 return -1;
3770 PyTuple_SET_ITEM(tup, len, element);
3772 PDATA_PUSH(self->stack, tup, -1);
3773 return 0;
3776 static int
3777 load_empty_list(Unpicklerobject *self)
3779 PyObject *list;
3781 if (!( list=PyList_New(0))) return -1;
3782 PDATA_PUSH(self->stack, list, -1);
3783 return 0;
3786 static int
3787 load_empty_dict(Unpicklerobject *self)
3789 PyObject *dict;
3791 if (!( dict=PyDict_New())) return -1;
3792 PDATA_PUSH(self->stack, dict, -1);
3793 return 0;
3797 static int
3798 load_list(Unpicklerobject *self)
3800 PyObject *list = 0;
3801 int i;
3803 if ((i = marker(self)) < 0) return -1;
3804 if (!( list=Pdata_popList(self->stack, i))) return -1;
3805 PDATA_PUSH(self->stack, list, -1);
3806 return 0;
3809 static int
3810 load_dict(Unpicklerobject *self)
3812 PyObject *dict, *key, *value;
3813 int i, j, k;
3815 if ((i = marker(self)) < 0) return -1;
3816 j=self->stack->length;
3818 if (!( dict = PyDict_New())) return -1;
3820 for (k = i+1; k < j; k += 2) {
3821 key =self->stack->data[k-1];
3822 value=self->stack->data[k ];
3823 if (PyDict_SetItem(dict, key, value) < 0) {
3824 Py_DECREF(dict);
3825 return -1;
3828 Pdata_clear(self->stack, i);
3829 PDATA_PUSH(self->stack, dict, -1);
3830 return 0;
3833 static PyObject *
3834 Instance_New(PyObject *cls, PyObject *args)
3836 PyObject *r = 0;
3838 if (PyClass_Check(cls)) {
3839 int l;
3841 if ((l=PyObject_Size(args)) < 0) goto err;
3842 if (!( l )) {
3843 PyObject *__getinitargs__;
3845 __getinitargs__ = PyObject_GetAttr(cls,
3846 __getinitargs___str);
3847 if (!__getinitargs__) {
3848 /* We have a class with no __getinitargs__,
3849 so bypass usual construction */
3850 PyObject *inst;
3852 PyErr_Clear();
3853 if (!( inst=PyInstance_NewRaw(cls, NULL)))
3854 goto err;
3855 return inst;
3857 Py_DECREF(__getinitargs__);
3860 if ((r=PyInstance_New(cls, args, NULL))) return r;
3861 else goto err;
3864 if ((r=PyObject_CallObject(cls, args))) return r;
3866 err:
3868 PyObject *tp, *v, *tb, *tmp_value;
3870 PyErr_Fetch(&tp, &v, &tb);
3871 tmp_value = v;
3872 /* NULL occurs when there was a KeyboardInterrupt */
3873 if (tmp_value == NULL)
3874 tmp_value = Py_None;
3875 if ((r = PyTuple_Pack(3, tmp_value, cls, args))) {
3876 Py_XDECREF(v);
3877 v=r;
3879 PyErr_Restore(tp,v,tb);
3881 return NULL;
3885 static int
3886 load_obj(Unpicklerobject *self)
3888 PyObject *class, *tup, *obj=0;
3889 int i;
3891 if ((i = marker(self)) < 0) return -1;
3892 if (!( tup=Pdata_popTuple(self->stack, i+1))) return -1;
3893 PDATA_POP(self->stack, class);
3894 if (class) {
3895 obj = Instance_New(class, tup);
3896 Py_DECREF(class);
3898 Py_DECREF(tup);
3900 if (! obj) return -1;
3901 PDATA_PUSH(self->stack, obj, -1);
3902 return 0;
3906 static int
3907 load_inst(Unpicklerobject *self)
3909 PyObject *tup, *class=0, *obj=0, *module_name, *class_name;
3910 int i, len;
3911 char *s;
3913 if ((i = marker(self)) < 0) return -1;
3915 if ((len = self->readline_func(self, &s)) < 0) return -1;
3916 if (len < 2) return bad_readline();
3917 module_name = PyString_FromStringAndSize(s, len - 1);
3918 if (!module_name) return -1;
3920 if ((len = self->readline_func(self, &s)) >= 0) {
3921 if (len < 2) return bad_readline();
3922 if ((class_name = PyString_FromStringAndSize(s, len - 1))) {
3923 class = find_class(module_name, class_name,
3924 self->find_class);
3925 Py_DECREF(class_name);
3928 Py_DECREF(module_name);
3930 if (! class) return -1;
3932 if ((tup=Pdata_popTuple(self->stack, i))) {
3933 obj = Instance_New(class, tup);
3934 Py_DECREF(tup);
3936 Py_DECREF(class);
3938 if (! obj) return -1;
3940 PDATA_PUSH(self->stack, obj, -1);
3941 return 0;
3944 static int
3945 load_newobj(Unpicklerobject *self)
3947 PyObject *args = NULL;
3948 PyObject *clsraw = NULL;
3949 PyTypeObject *cls; /* clsraw cast to its true type */
3950 PyObject *obj;
3952 /* Stack is ... cls argtuple, and we want to call
3953 * cls.__new__(cls, *argtuple).
3955 PDATA_POP(self->stack, args);
3956 if (args == NULL) goto Fail;
3957 if (! PyTuple_Check(args)) {
3958 PyErr_SetString(UnpicklingError, "NEWOBJ expected an arg "
3959 "tuple.");
3960 goto Fail;
3963 PDATA_POP(self->stack, clsraw);
3964 cls = (PyTypeObject *)clsraw;
3965 if (cls == NULL) goto Fail;
3966 if (! PyType_Check(cls)) {
3967 PyErr_SetString(UnpicklingError, "NEWOBJ class argument "
3968 "isn't a type object");
3969 goto Fail;
3971 if (cls->tp_new == NULL) {
3972 PyErr_SetString(UnpicklingError, "NEWOBJ class argument "
3973 "has NULL tp_new");
3974 goto Fail;
3977 /* Call __new__. */
3978 obj = cls->tp_new(cls, args, NULL);
3979 if (obj == NULL) goto Fail;
3981 Py_DECREF(args);
3982 Py_DECREF(clsraw);
3983 PDATA_PUSH(self->stack, obj, -1);
3984 return 0;
3986 Fail:
3987 Py_XDECREF(args);
3988 Py_XDECREF(clsraw);
3989 return -1;
3992 static int
3993 load_global(Unpicklerobject *self)
3995 PyObject *class = 0, *module_name = 0, *class_name = 0;
3996 int len;
3997 char *s;
3999 if ((len = self->readline_func(self, &s)) < 0) return -1;
4000 if (len < 2) return bad_readline();
4001 module_name = PyString_FromStringAndSize(s, len - 1);
4002 if (!module_name) return -1;
4004 if ((len = self->readline_func(self, &s)) >= 0) {
4005 if (len < 2) {
4006 Py_DECREF(module_name);
4007 return bad_readline();
4009 if ((class_name = PyString_FromStringAndSize(s, len - 1))) {
4010 class = find_class(module_name, class_name,
4011 self->find_class);
4012 Py_DECREF(class_name);
4015 Py_DECREF(module_name);
4017 if (! class) return -1;
4018 PDATA_PUSH(self->stack, class, -1);
4019 return 0;
4023 static int
4024 load_persid(Unpicklerobject *self)
4026 PyObject *pid = 0;
4027 int len;
4028 char *s;
4030 if (self->pers_func) {
4031 if ((len = self->readline_func(self, &s)) < 0) return -1;
4032 if (len < 2) return bad_readline();
4034 pid = PyString_FromStringAndSize(s, len - 1);
4035 if (!pid) return -1;
4037 if (PyList_Check(self->pers_func)) {
4038 if (PyList_Append(self->pers_func, pid) < 0) {
4039 Py_DECREF(pid);
4040 return -1;
4043 else {
4044 ARG_TUP(self, pid);
4045 if (self->arg) {
4046 pid = PyObject_Call(self->pers_func, self->arg,
4047 NULL);
4048 FREE_ARG_TUP(self);
4052 if (! pid) return -1;
4054 PDATA_PUSH(self->stack, pid, -1);
4055 return 0;
4057 else {
4058 PyErr_SetString(UnpicklingError,
4059 "A load persistent id instruction was encountered,\n"
4060 "but no persistent_load function was specified.");
4061 return -1;
4065 static int
4066 load_binpersid(Unpicklerobject *self)
4068 PyObject *pid = 0;
4070 if (self->pers_func) {
4071 PDATA_POP(self->stack, pid);
4072 if (! pid) return -1;
4074 if (PyList_Check(self->pers_func)) {
4075 if (PyList_Append(self->pers_func, pid) < 0) {
4076 Py_DECREF(pid);
4077 return -1;
4080 else {
4081 ARG_TUP(self, pid);
4082 if (self->arg) {
4083 pid = PyObject_Call(self->pers_func, self->arg,
4084 NULL);
4085 FREE_ARG_TUP(self);
4087 if (! pid) return -1;
4090 PDATA_PUSH(self->stack, pid, -1);
4091 return 0;
4093 else {
4094 PyErr_SetString(UnpicklingError,
4095 "A load persistent id instruction was encountered,\n"
4096 "but no persistent_load function was specified.");
4097 return -1;
4102 static int
4103 load_pop(Unpicklerobject *self)
4105 int len = self->stack->length;
4107 /* Note that we split the (pickle.py) stack into two stacks,
4108 an object stack and a mark stack. We have to be clever and
4109 pop the right one. We do this by looking at the top of the
4110 mark stack first, and only signalling a stack underflow if
4111 the object stack is empty and the mark stack doesn't match
4112 our expectations.
4114 if (self->num_marks > 0 && self->marks[self->num_marks - 1] == len) {
4115 self->num_marks--;
4116 } else if (len > 0) {
4117 len--;
4118 Py_DECREF(self->stack->data[len]);
4119 self->stack->length = len;
4120 } else {
4121 return stackUnderflow();
4123 return 0;
4127 static int
4128 load_pop_mark(Unpicklerobject *self)
4130 int i;
4132 if ((i = marker(self)) < 0)
4133 return -1;
4135 Pdata_clear(self->stack, i);
4137 return 0;
4141 static int
4142 load_dup(Unpicklerobject *self)
4144 PyObject *last;
4145 int len;
4147 if ((len = self->stack->length) <= 0) return stackUnderflow();
4148 last=self->stack->data[len-1];
4149 Py_INCREF(last);
4150 PDATA_PUSH(self->stack, last, -1);
4151 return 0;
4155 static int
4156 load_get(Unpicklerobject *self)
4158 PyObject *py_str = 0, *value = 0;
4159 int len;
4160 char *s;
4161 int rc;
4163 if ((len = self->readline_func(self, &s)) < 0) return -1;
4164 if (len < 2) return bad_readline();
4166 if (!( py_str = PyString_FromStringAndSize(s, len - 1))) return -1;
4168 value = PyDict_GetItem(self->memo, py_str);
4169 if (! value) {
4170 PyErr_SetObject(BadPickleGet, py_str);
4171 rc = -1;
4173 else {
4174 PDATA_APPEND(self->stack, value, -1);
4175 rc = 0;
4178 Py_DECREF(py_str);
4179 return rc;
4183 static int
4184 load_binget(Unpicklerobject *self)
4186 PyObject *py_key = 0, *value = 0;
4187 unsigned char key;
4188 char *s;
4189 int rc;
4191 if (self->read_func(self, &s, 1) < 0) return -1;
4193 key = (unsigned char)s[0];
4194 if (!( py_key = PyInt_FromLong((long)key))) return -1;
4196 value = PyDict_GetItem(self->memo, py_key);
4197 if (! value) {
4198 PyErr_SetObject(BadPickleGet, py_key);
4199 rc = -1;
4201 else {
4202 PDATA_APPEND(self->stack, value, -1);
4203 rc = 0;
4206 Py_DECREF(py_key);
4207 return rc;
4211 static int
4212 load_long_binget(Unpicklerobject *self)
4214 PyObject *py_key = 0, *value = 0;
4215 unsigned char c;
4216 char *s;
4217 long key;
4218 int rc;
4220 if (self->read_func(self, &s, 4) < 0) return -1;
4222 c = (unsigned char)s[0];
4223 key = (long)c;
4224 c = (unsigned char)s[1];
4225 key |= (long)c << 8;
4226 c = (unsigned char)s[2];
4227 key |= (long)c << 16;
4228 c = (unsigned char)s[3];
4229 key |= (long)c << 24;
4231 if (!( py_key = PyInt_FromLong((long)key))) return -1;
4233 value = PyDict_GetItem(self->memo, py_key);
4234 if (! value) {
4235 PyErr_SetObject(BadPickleGet, py_key);
4236 rc = -1;
4238 else {
4239 PDATA_APPEND(self->stack, value, -1);
4240 rc = 0;
4243 Py_DECREF(py_key);
4244 return rc;
4247 /* Push an object from the extension registry (EXT[124]). nbytes is
4248 * the number of bytes following the opcode, holding the index (code) value.
4250 static int
4251 load_extension(Unpicklerobject *self, int nbytes)
4253 char *codebytes; /* the nbytes bytes after the opcode */
4254 long code; /* calc_binint returns long */
4255 PyObject *py_code; /* code as a Python int */
4256 PyObject *obj; /* the object to push */
4257 PyObject *pair; /* (module_name, class_name) */
4258 PyObject *module_name, *class_name;
4260 assert(nbytes == 1 || nbytes == 2 || nbytes == 4);
4261 if (self->read_func(self, &codebytes, nbytes) < 0) return -1;
4262 code = calc_binint(codebytes, nbytes);
4263 if (code <= 0) { /* note that 0 is forbidden */
4264 /* Corrupt or hostile pickle. */
4265 PyErr_SetString(UnpicklingError, "EXT specifies code <= 0");
4266 return -1;
4269 /* Look for the code in the cache. */
4270 py_code = PyInt_FromLong(code);
4271 if (py_code == NULL) return -1;
4272 obj = PyDict_GetItem(extension_cache, py_code);
4273 if (obj != NULL) {
4274 /* Bingo. */
4275 Py_DECREF(py_code);
4276 PDATA_APPEND(self->stack, obj, -1);
4277 return 0;
4280 /* Look up the (module_name, class_name) pair. */
4281 pair = PyDict_GetItem(inverted_registry, py_code);
4282 if (pair == NULL) {
4283 Py_DECREF(py_code);
4284 PyErr_Format(PyExc_ValueError, "unregistered extension "
4285 "code %ld", code);
4286 return -1;
4288 /* Since the extension registry is manipulable via Python code,
4289 * confirm that pair is really a 2-tuple of strings.
4291 if (!PyTuple_Check(pair) || PyTuple_Size(pair) != 2 ||
4292 !PyString_Check(module_name = PyTuple_GET_ITEM(pair, 0)) ||
4293 !PyString_Check(class_name = PyTuple_GET_ITEM(pair, 1))) {
4294 Py_DECREF(py_code);
4295 PyErr_Format(PyExc_ValueError, "_inverted_registry[%ld] "
4296 "isn't a 2-tuple of strings", code);
4297 return -1;
4299 /* Load the object. */
4300 obj = find_class(module_name, class_name, self->find_class);
4301 if (obj == NULL) {
4302 Py_DECREF(py_code);
4303 return -1;
4305 /* Cache code -> obj. */
4306 code = PyDict_SetItem(extension_cache, py_code, obj);
4307 Py_DECREF(py_code);
4308 if (code < 0) {
4309 Py_DECREF(obj);
4310 return -1;
4312 PDATA_PUSH(self->stack, obj, -1);
4313 return 0;
4316 static int
4317 load_put(Unpicklerobject *self)
4319 PyObject *py_str = 0, *value = 0;
4320 int len, l;
4321 char *s;
4323 if ((l = self->readline_func(self, &s)) < 0) return -1;
4324 if (l < 2) return bad_readline();
4325 if (!( len=self->stack->length )) return stackUnderflow();
4326 if (!( py_str = PyString_FromStringAndSize(s, l - 1))) return -1;
4327 value=self->stack->data[len-1];
4328 l=PyDict_SetItem(self->memo, py_str, value);
4329 Py_DECREF(py_str);
4330 return l;
4334 static int
4335 load_binput(Unpicklerobject *self)
4337 PyObject *py_key = 0, *value = 0;
4338 unsigned char key;
4339 char *s;
4340 int len;
4342 if (self->read_func(self, &s, 1) < 0) return -1;
4343 if (!( (len=self->stack->length) > 0 )) return stackUnderflow();
4345 key = (unsigned char)s[0];
4347 if (!( py_key = PyInt_FromLong((long)key))) return -1;
4348 value=self->stack->data[len-1];
4349 len=PyDict_SetItem(self->memo, py_key, value);
4350 Py_DECREF(py_key);
4351 return len;
4355 static int
4356 load_long_binput(Unpicklerobject *self)
4358 PyObject *py_key = 0, *value = 0;
4359 long key;
4360 unsigned char c;
4361 char *s;
4362 int len;
4364 if (self->read_func(self, &s, 4) < 0) return -1;
4365 if (!( len=self->stack->length )) return stackUnderflow();
4367 c = (unsigned char)s[0];
4368 key = (long)c;
4369 c = (unsigned char)s[1];
4370 key |= (long)c << 8;
4371 c = (unsigned char)s[2];
4372 key |= (long)c << 16;
4373 c = (unsigned char)s[3];
4374 key |= (long)c << 24;
4376 if (!( py_key = PyInt_FromLong(key))) return -1;
4377 value=self->stack->data[len-1];
4378 len=PyDict_SetItem(self->memo, py_key, value);
4379 Py_DECREF(py_key);
4380 return len;
4384 static int
4385 do_append(Unpicklerobject *self, int x)
4387 PyObject *value = 0, *list = 0, *append_method = 0;
4388 int len, i;
4390 len=self->stack->length;
4391 if (!( len >= x && x > 0 )) return stackUnderflow();
4392 /* nothing to do */
4393 if (len==x) return 0;
4395 list=self->stack->data[x-1];
4397 if (PyList_Check(list)) {
4398 PyObject *slice;
4399 int list_len;
4401 slice=Pdata_popList(self->stack, x);
4402 if (! slice) return -1;
4403 list_len = PyList_GET_SIZE(list);
4404 i=PyList_SetSlice(list, list_len, list_len, slice);
4405 Py_DECREF(slice);
4406 return i;
4408 else {
4410 if (!( append_method = PyObject_GetAttr(list, append_str)))
4411 return -1;
4413 for (i = x; i < len; i++) {
4414 PyObject *junk;
4416 value=self->stack->data[i];
4417 junk=0;
4418 ARG_TUP(self, value);
4419 if (self->arg) {
4420 junk = PyObject_Call(append_method, self->arg,
4421 NULL);
4422 FREE_ARG_TUP(self);
4424 if (! junk) {
4425 Pdata_clear(self->stack, i+1);
4426 self->stack->length=x;
4427 Py_DECREF(append_method);
4428 return -1;
4430 Py_DECREF(junk);
4432 self->stack->length=x;
4433 Py_DECREF(append_method);
4436 return 0;
4440 static int
4441 load_append(Unpicklerobject *self)
4443 return do_append(self, self->stack->length - 1);
4447 static int
4448 load_appends(Unpicklerobject *self)
4450 return do_append(self, marker(self));
4454 static int
4455 do_setitems(Unpicklerobject *self, int x)
4457 PyObject *value = 0, *key = 0, *dict = 0;
4458 int len, i, r=0;
4460 if (!( (len=self->stack->length) >= x
4461 && x > 0 )) return stackUnderflow();
4463 dict=self->stack->data[x-1];
4465 for (i = x+1; i < len; i += 2) {
4466 key =self->stack->data[i-1];
4467 value=self->stack->data[i ];
4468 if (PyObject_SetItem(dict, key, value) < 0) {
4469 r=-1;
4470 break;
4474 Pdata_clear(self->stack, x);
4476 return r;
4480 static int
4481 load_setitem(Unpicklerobject *self)
4483 return do_setitems(self, self->stack->length - 2);
4486 static int
4487 load_setitems(Unpicklerobject *self)
4489 return do_setitems(self, marker(self));
4493 static int
4494 load_build(Unpicklerobject *self)
4496 PyObject *state, *inst, *slotstate;
4497 PyObject *__setstate__;
4498 PyObject *d_key, *d_value;
4499 Py_ssize_t i;
4500 int res = -1;
4502 /* Stack is ... instance, state. We want to leave instance at
4503 * the stack top, possibly mutated via instance.__setstate__(state).
4505 if (self->stack->length < 2)
4506 return stackUnderflow();
4507 PDATA_POP(self->stack, state);
4508 if (state == NULL)
4509 return -1;
4510 inst = self->stack->data[self->stack->length - 1];
4512 __setstate__ = PyObject_GetAttr(inst, __setstate___str);
4513 if (__setstate__ != NULL) {
4514 PyObject *junk = NULL;
4516 /* The explicit __setstate__ is responsible for everything. */
4517 ARG_TUP(self, state);
4518 if (self->arg) {
4519 junk = PyObject_Call(__setstate__, self->arg, NULL);
4520 FREE_ARG_TUP(self);
4522 Py_DECREF(__setstate__);
4523 if (junk == NULL)
4524 return -1;
4525 Py_DECREF(junk);
4526 return 0;
4528 if (!PyErr_ExceptionMatches(PyExc_AttributeError))
4529 return -1;
4530 PyErr_Clear();
4532 /* A default __setstate__. First see whether state embeds a
4533 * slot state dict too (a proto 2 addition).
4535 if (PyTuple_Check(state) && PyTuple_Size(state) == 2) {
4536 PyObject *temp = state;
4537 state = PyTuple_GET_ITEM(temp, 0);
4538 slotstate = PyTuple_GET_ITEM(temp, 1);
4539 Py_INCREF(state);
4540 Py_INCREF(slotstate);
4541 Py_DECREF(temp);
4543 else
4544 slotstate = NULL;
4546 /* Set inst.__dict__ from the state dict (if any). */
4547 if (state != Py_None) {
4548 PyObject *dict;
4549 if (! PyDict_Check(state)) {
4550 PyErr_SetString(UnpicklingError, "state is not a "
4551 "dictionary");
4552 goto finally;
4554 dict = PyObject_GetAttr(inst, __dict___str);
4555 if (dict == NULL)
4556 goto finally;
4558 i = 0;
4559 while (PyDict_Next(state, &i, &d_key, &d_value)) {
4560 /* normally the keys for instance attributes are
4561 interned. we should try to do that here. */
4562 Py_INCREF(d_key);
4563 if (PyString_CheckExact(d_key))
4564 PyString_InternInPlace(&d_key);
4565 if (PyObject_SetItem(dict, d_key, d_value) < 0) {
4566 Py_DECREF(d_key);
4567 goto finally;
4569 Py_DECREF(d_key);
4571 Py_DECREF(dict);
4574 /* Also set instance attributes from the slotstate dict (if any). */
4575 if (slotstate != NULL) {
4576 if (! PyDict_Check(slotstate)) {
4577 PyErr_SetString(UnpicklingError, "slot state is not "
4578 "a dictionary");
4579 goto finally;
4581 i = 0;
4582 while (PyDict_Next(slotstate, &i, &d_key, &d_value)) {
4583 if (PyObject_SetAttr(inst, d_key, d_value) < 0)
4584 goto finally;
4587 res = 0;
4589 finally:
4590 Py_DECREF(state);
4591 Py_XDECREF(slotstate);
4592 return res;
4596 static int
4597 load_mark(Unpicklerobject *self)
4599 int s;
4601 /* Note that we split the (pickle.py) stack into two stacks, an
4602 object stack and a mark stack. Here we push a mark onto the
4603 mark stack.
4606 if ((self->num_marks + 1) >= self->marks_size) {
4607 int *marks;
4608 s=self->marks_size+20;
4609 if (s <= self->num_marks) s=self->num_marks + 1;
4610 if (self->marks == NULL)
4611 marks=(int *)malloc(s * sizeof(int));
4612 else
4613 marks=(int *)realloc(self->marks,
4614 s * sizeof(int));
4615 if (!marks) {
4616 PyErr_NoMemory();
4617 return -1;
4619 self->marks = marks;
4620 self->marks_size = s;
4623 self->marks[self->num_marks++] = self->stack->length;
4625 return 0;
4628 static int
4629 load_reduce(Unpicklerobject *self)
4631 PyObject *callable = 0, *arg_tup = 0, *ob = 0;
4633 PDATA_POP(self->stack, arg_tup);
4634 if (! arg_tup) return -1;
4635 PDATA_POP(self->stack, callable);
4636 if (callable) {
4637 ob = Instance_New(callable, arg_tup);
4638 Py_DECREF(callable);
4640 Py_DECREF(arg_tup);
4642 if (! ob) return -1;
4644 PDATA_PUSH(self->stack, ob, -1);
4645 return 0;
4648 /* Just raises an error if we don't know the protocol specified. PROTO
4649 * is the first opcode for protocols >= 2.
4651 static int
4652 load_proto(Unpicklerobject *self)
4654 int i;
4655 char *protobyte;
4657 i = self->read_func(self, &protobyte, 1);
4658 if (i < 0)
4659 return -1;
4661 i = calc_binint(protobyte, 1);
4662 /* No point checking for < 0, since calc_binint returns an unsigned
4663 * int when chewing on 1 byte.
4665 assert(i >= 0);
4666 if (i <= HIGHEST_PROTOCOL)
4667 return 0;
4669 PyErr_Format(PyExc_ValueError, "unsupported pickle protocol: %d", i);
4670 return -1;
4673 static PyObject *
4674 load(Unpicklerobject *self)
4676 PyObject *err = 0, *val = 0;
4677 char *s;
4679 self->num_marks = 0;
4680 if (self->stack->length) Pdata_clear(self->stack, 0);
4682 while (1) {
4683 if (self->read_func(self, &s, 1) < 0)
4684 break;
4686 switch (s[0]) {
4687 case NONE:
4688 if (load_none(self) < 0)
4689 break;
4690 continue;
4692 case BININT:
4693 if (load_binint(self) < 0)
4694 break;
4695 continue;
4697 case BININT1:
4698 if (load_binint1(self) < 0)
4699 break;
4700 continue;
4702 case BININT2:
4703 if (load_binint2(self) < 0)
4704 break;
4705 continue;
4707 case INT:
4708 if (load_int(self) < 0)
4709 break;
4710 continue;
4712 case LONG:
4713 if (load_long(self) < 0)
4714 break;
4715 continue;
4717 case LONG1:
4718 if (load_counted_long(self, 1) < 0)
4719 break;
4720 continue;
4722 case LONG4:
4723 if (load_counted_long(self, 4) < 0)
4724 break;
4725 continue;
4727 case FLOAT:
4728 if (load_float(self) < 0)
4729 break;
4730 continue;
4732 case BINFLOAT:
4733 if (load_binfloat(self) < 0)
4734 break;
4735 continue;
4737 case BINSTRING:
4738 if (load_binstring(self) < 0)
4739 break;
4740 continue;
4742 case SHORT_BINSTRING:
4743 if (load_short_binstring(self) < 0)
4744 break;
4745 continue;
4747 case STRING:
4748 if (load_string(self) < 0)
4749 break;
4750 continue;
4752 #ifdef Py_USING_UNICODE
4753 case UNICODE:
4754 if (load_unicode(self) < 0)
4755 break;
4756 continue;
4758 case BINUNICODE:
4759 if (load_binunicode(self) < 0)
4760 break;
4761 continue;
4762 #endif
4764 case EMPTY_TUPLE:
4765 if (load_counted_tuple(self, 0) < 0)
4766 break;
4767 continue;
4769 case TUPLE1:
4770 if (load_counted_tuple(self, 1) < 0)
4771 break;
4772 continue;
4774 case TUPLE2:
4775 if (load_counted_tuple(self, 2) < 0)
4776 break;
4777 continue;
4779 case TUPLE3:
4780 if (load_counted_tuple(self, 3) < 0)
4781 break;
4782 continue;
4784 case TUPLE:
4785 if (load_tuple(self) < 0)
4786 break;
4787 continue;
4789 case EMPTY_LIST:
4790 if (load_empty_list(self) < 0)
4791 break;
4792 continue;
4794 case LIST:
4795 if (load_list(self) < 0)
4796 break;
4797 continue;
4799 case EMPTY_DICT:
4800 if (load_empty_dict(self) < 0)
4801 break;
4802 continue;
4804 case DICT:
4805 if (load_dict(self) < 0)
4806 break;
4807 continue;
4809 case OBJ:
4810 if (load_obj(self) < 0)
4811 break;
4812 continue;
4814 case INST:
4815 if (load_inst(self) < 0)
4816 break;
4817 continue;
4819 case NEWOBJ:
4820 if (load_newobj(self) < 0)
4821 break;
4822 continue;
4824 case GLOBAL:
4825 if (load_global(self) < 0)
4826 break;
4827 continue;
4829 case APPEND:
4830 if (load_append(self) < 0)
4831 break;
4832 continue;
4834 case APPENDS:
4835 if (load_appends(self) < 0)
4836 break;
4837 continue;
4839 case BUILD:
4840 if (load_build(self) < 0)
4841 break;
4842 continue;
4844 case DUP:
4845 if (load_dup(self) < 0)
4846 break;
4847 continue;
4849 case BINGET:
4850 if (load_binget(self) < 0)
4851 break;
4852 continue;
4854 case LONG_BINGET:
4855 if (load_long_binget(self) < 0)
4856 break;
4857 continue;
4859 case GET:
4860 if (load_get(self) < 0)
4861 break;
4862 continue;
4864 case EXT1:
4865 if (load_extension(self, 1) < 0)
4866 break;
4867 continue;
4869 case EXT2:
4870 if (load_extension(self, 2) < 0)
4871 break;
4872 continue;
4874 case EXT4:
4875 if (load_extension(self, 4) < 0)
4876 break;
4877 continue;
4878 case MARK:
4879 if (load_mark(self) < 0)
4880 break;
4881 continue;
4883 case BINPUT:
4884 if (load_binput(self) < 0)
4885 break;
4886 continue;
4888 case LONG_BINPUT:
4889 if (load_long_binput(self) < 0)
4890 break;
4891 continue;
4893 case PUT:
4894 if (load_put(self) < 0)
4895 break;
4896 continue;
4898 case POP:
4899 if (load_pop(self) < 0)
4900 break;
4901 continue;
4903 case POP_MARK:
4904 if (load_pop_mark(self) < 0)
4905 break;
4906 continue;
4908 case SETITEM:
4909 if (load_setitem(self) < 0)
4910 break;
4911 continue;
4913 case SETITEMS:
4914 if (load_setitems(self) < 0)
4915 break;
4916 continue;
4918 case STOP:
4919 break;
4921 case PERSID:
4922 if (load_persid(self) < 0)
4923 break;
4924 continue;
4926 case BINPERSID:
4927 if (load_binpersid(self) < 0)
4928 break;
4929 continue;
4931 case REDUCE:
4932 if (load_reduce(self) < 0)
4933 break;
4934 continue;
4936 case PROTO:
4937 if (load_proto(self) < 0)
4938 break;
4939 continue;
4941 case NEWTRUE:
4942 if (load_bool(self, Py_True) < 0)
4943 break;
4944 continue;
4946 case NEWFALSE:
4947 if (load_bool(self, Py_False) < 0)
4948 break;
4949 continue;
4951 case '\0':
4952 /* end of file */
4953 PyErr_SetNone(PyExc_EOFError);
4954 break;
4956 default:
4957 cPickle_ErrFormat(UnpicklingError,
4958 "invalid load key, '%s'.",
4959 "c", s[0]);
4960 return NULL;
4963 break;
4966 if ((err = PyErr_Occurred())) {
4967 if (err == PyExc_EOFError) {
4968 PyErr_SetNone(PyExc_EOFError);
4970 return NULL;
4973 PDATA_POP(self->stack, val);
4974 return val;
4978 /* No-load functions to support noload, which is used to
4979 find persistent references. */
4981 static int
4982 noload_obj(Unpicklerobject *self)
4984 int i;
4986 if ((i = marker(self)) < 0) return -1;
4987 return Pdata_clear(self->stack, i+1);
4991 static int
4992 noload_inst(Unpicklerobject *self)
4994 int i;
4995 char *s;
4997 if ((i = marker(self)) < 0) return -1;
4998 Pdata_clear(self->stack, i);
4999 if (self->readline_func(self, &s) < 0) return -1;
5000 if (self->readline_func(self, &s) < 0) return -1;
5001 PDATA_APPEND(self->stack, Py_None, -1);
5002 return 0;
5005 static int
5006 noload_newobj(Unpicklerobject *self)
5008 PyObject *obj;
5010 PDATA_POP(self->stack, obj); /* pop argtuple */
5011 if (obj == NULL) return -1;
5012 Py_DECREF(obj);
5014 PDATA_POP(self->stack, obj); /* pop cls */
5015 if (obj == NULL) return -1;
5016 Py_DECREF(obj);
5018 PDATA_APPEND(self->stack, Py_None, -1);
5019 return 0;
5022 static int
5023 noload_global(Unpicklerobject *self)
5025 char *s;
5027 if (self->readline_func(self, &s) < 0) return -1;
5028 if (self->readline_func(self, &s) < 0) return -1;
5029 PDATA_APPEND(self->stack, Py_None,-1);
5030 return 0;
5033 static int
5034 noload_reduce(Unpicklerobject *self)
5037 if (self->stack->length < 2) return stackUnderflow();
5038 Pdata_clear(self->stack, self->stack->length-2);
5039 PDATA_APPEND(self->stack, Py_None,-1);
5040 return 0;
5043 static int
5044 noload_build(Unpicklerobject *self) {
5046 if (self->stack->length < 1) return stackUnderflow();
5047 Pdata_clear(self->stack, self->stack->length-1);
5048 return 0;
5051 static int
5052 noload_extension(Unpicklerobject *self, int nbytes)
5054 char *codebytes;
5056 assert(nbytes == 1 || nbytes == 2 || nbytes == 4);
5057 if (self->read_func(self, &codebytes, nbytes) < 0) return -1;
5058 PDATA_APPEND(self->stack, Py_None, -1);
5059 return 0;
5062 static int
5063 noload_append(Unpicklerobject *self)
5065 return Pdata_clear(self->stack, self->stack->length - 1);
5068 static int
5069 noload_appends(Unpicklerobject *self)
5071 int i;
5072 if ((i = marker(self)) < 0) return -1;
5073 return Pdata_clear(self->stack, i);
5076 static int
5077 noload_setitem(Unpicklerobject *self)
5079 return Pdata_clear(self->stack, self->stack->length - 2);
5082 static int
5083 noload_setitems(Unpicklerobject *self)
5085 int i;
5086 if ((i = marker(self)) < 0) return -1;
5087 return Pdata_clear(self->stack, i);
5090 static PyObject *
5091 noload(Unpicklerobject *self)
5093 PyObject *err = 0, *val = 0;
5094 char *s;
5096 self->num_marks = 0;
5097 Pdata_clear(self->stack, 0);
5099 while (1) {
5100 if (self->read_func(self, &s, 1) < 0)
5101 break;
5103 switch (s[0]) {
5104 case NONE:
5105 if (load_none(self) < 0)
5106 break;
5107 continue;
5109 case BININT:
5110 if (load_binint(self) < 0)
5111 break;
5112 continue;
5114 case BININT1:
5115 if (load_binint1(self) < 0)
5116 break;
5117 continue;
5119 case BININT2:
5120 if (load_binint2(self) < 0)
5121 break;
5122 continue;
5124 case INT:
5125 if (load_int(self) < 0)
5126 break;
5127 continue;
5129 case LONG:
5130 if (load_long(self) < 0)
5131 break;
5132 continue;
5134 case LONG1:
5135 if (load_counted_long(self, 1) < 0)
5136 break;
5137 continue;
5139 case LONG4:
5140 if (load_counted_long(self, 4) < 0)
5141 break;
5142 continue;
5144 case FLOAT:
5145 if (load_float(self) < 0)
5146 break;
5147 continue;
5149 case BINFLOAT:
5150 if (load_binfloat(self) < 0)
5151 break;
5152 continue;
5154 case BINSTRING:
5155 if (load_binstring(self) < 0)
5156 break;
5157 continue;
5159 case SHORT_BINSTRING:
5160 if (load_short_binstring(self) < 0)
5161 break;
5162 continue;
5164 case STRING:
5165 if (load_string(self) < 0)
5166 break;
5167 continue;
5169 #ifdef Py_USING_UNICODE
5170 case UNICODE:
5171 if (load_unicode(self) < 0)
5172 break;
5173 continue;
5175 case BINUNICODE:
5176 if (load_binunicode(self) < 0)
5177 break;
5178 continue;
5179 #endif
5181 case EMPTY_TUPLE:
5182 if (load_counted_tuple(self, 0) < 0)
5183 break;
5184 continue;
5186 case TUPLE1:
5187 if (load_counted_tuple(self, 1) < 0)
5188 break;
5189 continue;
5191 case TUPLE2:
5192 if (load_counted_tuple(self, 2) < 0)
5193 break;
5194 continue;
5196 case TUPLE3:
5197 if (load_counted_tuple(self, 3) < 0)
5198 break;
5199 continue;
5201 case TUPLE:
5202 if (load_tuple(self) < 0)
5203 break;
5204 continue;
5206 case EMPTY_LIST:
5207 if (load_empty_list(self) < 0)
5208 break;
5209 continue;
5211 case LIST:
5212 if (load_list(self) < 0)
5213 break;
5214 continue;
5216 case EMPTY_DICT:
5217 if (load_empty_dict(self) < 0)
5218 break;
5219 continue;
5221 case DICT:
5222 if (load_dict(self) < 0)
5223 break;
5224 continue;
5226 case OBJ:
5227 if (noload_obj(self) < 0)
5228 break;
5229 continue;
5231 case INST:
5232 if (noload_inst(self) < 0)
5233 break;
5234 continue;
5236 case NEWOBJ:
5237 if (noload_newobj(self) < 0)
5238 break;
5239 continue;
5241 case GLOBAL:
5242 if (noload_global(self) < 0)
5243 break;
5244 continue;
5246 case APPEND:
5247 if (noload_append(self) < 0)
5248 break;
5249 continue;
5251 case APPENDS:
5252 if (noload_appends(self) < 0)
5253 break;
5254 continue;
5256 case BUILD:
5257 if (noload_build(self) < 0)
5258 break;
5259 continue;
5261 case DUP:
5262 if (load_dup(self) < 0)
5263 break;
5264 continue;
5266 case BINGET:
5267 if (load_binget(self) < 0)
5268 break;
5269 continue;
5271 case LONG_BINGET:
5272 if (load_long_binget(self) < 0)
5273 break;
5274 continue;
5276 case GET:
5277 if (load_get(self) < 0)
5278 break;
5279 continue;
5281 case EXT1:
5282 if (noload_extension(self, 1) < 0)
5283 break;
5284 continue;
5286 case EXT2:
5287 if (noload_extension(self, 2) < 0)
5288 break;
5289 continue;
5291 case EXT4:
5292 if (noload_extension(self, 4) < 0)
5293 break;
5294 continue;
5296 case MARK:
5297 if (load_mark(self) < 0)
5298 break;
5299 continue;
5301 case BINPUT:
5302 if (load_binput(self) < 0)
5303 break;
5304 continue;
5306 case LONG_BINPUT:
5307 if (load_long_binput(self) < 0)
5308 break;
5309 continue;
5311 case PUT:
5312 if (load_put(self) < 0)
5313 break;
5314 continue;
5316 case POP:
5317 if (load_pop(self) < 0)
5318 break;
5319 continue;
5321 case POP_MARK:
5322 if (load_pop_mark(self) < 0)
5323 break;
5324 continue;
5326 case SETITEM:
5327 if (noload_setitem(self) < 0)
5328 break;
5329 continue;
5331 case SETITEMS:
5332 if (noload_setitems(self) < 0)
5333 break;
5334 continue;
5336 case STOP:
5337 break;
5339 case PERSID:
5340 if (load_persid(self) < 0)
5341 break;
5342 continue;
5344 case BINPERSID:
5345 if (load_binpersid(self) < 0)
5346 break;
5347 continue;
5349 case REDUCE:
5350 if (noload_reduce(self) < 0)
5351 break;
5352 continue;
5354 case PROTO:
5355 if (load_proto(self) < 0)
5356 break;
5357 continue;
5359 case NEWTRUE:
5360 if (load_bool(self, Py_True) < 0)
5361 break;
5362 continue;
5364 case NEWFALSE:
5365 if (load_bool(self, Py_False) < 0)
5366 break;
5367 continue;
5368 default:
5369 cPickle_ErrFormat(UnpicklingError,
5370 "invalid load key, '%s'.",
5371 "c", s[0]);
5372 return NULL;
5375 break;
5378 if ((err = PyErr_Occurred())) {
5379 if (err == PyExc_EOFError) {
5380 PyErr_SetNone(PyExc_EOFError);
5382 return NULL;
5385 PDATA_POP(self->stack, val);
5386 return val;
5390 static PyObject *
5391 Unpickler_load(Unpicklerobject *self, PyObject *unused)
5393 return load(self);
5396 static PyObject *
5397 Unpickler_noload(Unpicklerobject *self, PyObject *unused)
5399 return noload(self);
5403 static struct PyMethodDef Unpickler_methods[] = {
5404 {"load", (PyCFunction)Unpickler_load, METH_NOARGS,
5405 PyDoc_STR("load() -- Load a pickle")
5407 {"noload", (PyCFunction)Unpickler_noload, METH_NOARGS,
5408 PyDoc_STR(
5409 "noload() -- not load a pickle, but go through most of the motions\n"
5410 "\n"
5411 "This function can be used to read past a pickle without instantiating\n"
5412 "any objects or importing any modules. It can also be used to find all\n"
5413 "persistent references without instantiating any objects or importing\n"
5414 "any modules.\n")
5416 {NULL, NULL} /* sentinel */
5420 static Unpicklerobject *
5421 newUnpicklerobject(PyObject *f)
5423 Unpicklerobject *self;
5425 if (!( self = PyObject_GC_New(Unpicklerobject, &Unpicklertype)))
5426 return NULL;
5428 self->file = NULL;
5429 self->arg = NULL;
5430 self->stack = (Pdata*)Pdata_New();
5431 self->pers_func = NULL;
5432 self->last_string = NULL;
5433 self->marks = NULL;
5434 self->num_marks = 0;
5435 self->marks_size = 0;
5436 self->buf_size = 0;
5437 self->read = NULL;
5438 self->readline = NULL;
5439 self->find_class = NULL;
5441 if (!( self->memo = PyDict_New()))
5442 goto err;
5444 if (!self->stack)
5445 goto err;
5447 Py_INCREF(f);
5448 self->file = f;
5450 /* Set read, readline based on type of f */
5451 if (PyFile_Check(f)) {
5452 self->fp = PyFile_AsFile(f);
5453 if (self->fp == NULL) {
5454 PyErr_SetString(PyExc_ValueError,
5455 "I/O operation on closed file");
5456 goto err;
5458 self->read_func = read_file;
5459 self->readline_func = readline_file;
5461 else if (PycStringIO_InputCheck(f)) {
5462 self->fp = NULL;
5463 self->read_func = read_cStringIO;
5464 self->readline_func = readline_cStringIO;
5466 else {
5468 self->fp = NULL;
5469 self->read_func = read_other;
5470 self->readline_func = readline_other;
5472 if (!( (self->readline = PyObject_GetAttr(f, readline_str)) &&
5473 (self->read = PyObject_GetAttr(f, read_str)))) {
5474 PyErr_Clear();
5475 PyErr_SetString( PyExc_TypeError,
5476 "argument must have 'read' and "
5477 "'readline' attributes" );
5478 goto err;
5481 PyObject_GC_Track(self);
5483 return self;
5485 err:
5486 Py_DECREF((PyObject *)self);
5487 return NULL;
5491 static PyObject *
5492 get_Unpickler(PyObject *self, PyObject *file)
5494 return (PyObject *)newUnpicklerobject(file);
5498 static void
5499 Unpickler_dealloc(Unpicklerobject *self)
5501 PyObject_GC_UnTrack((PyObject *)self);
5502 Py_XDECREF(self->readline);
5503 Py_XDECREF(self->read);
5504 Py_XDECREF(self->file);
5505 Py_XDECREF(self->memo);
5506 Py_XDECREF(self->stack);
5507 Py_XDECREF(self->pers_func);
5508 Py_XDECREF(self->arg);
5509 Py_XDECREF(self->last_string);
5510 Py_XDECREF(self->find_class);
5512 if (self->marks) {
5513 free(self->marks);
5516 if (self->buf_size) {
5517 free(self->buf);
5520 Py_TYPE(self)->tp_free((PyObject *)self);
5523 static int
5524 Unpickler_traverse(Unpicklerobject *self, visitproc visit, void *arg)
5526 Py_VISIT(self->readline);
5527 Py_VISIT(self->read);
5528 Py_VISIT(self->file);
5529 Py_VISIT(self->memo);
5530 Py_VISIT(self->stack);
5531 Py_VISIT(self->pers_func);
5532 Py_VISIT(self->arg);
5533 Py_VISIT(self->last_string);
5534 Py_VISIT(self->find_class);
5535 return 0;
5538 static int
5539 Unpickler_clear(Unpicklerobject *self)
5541 Py_CLEAR(self->readline);
5542 Py_CLEAR(self->read);
5543 Py_CLEAR(self->file);
5544 Py_CLEAR(self->memo);
5545 Py_CLEAR(self->stack);
5546 Py_CLEAR(self->pers_func);
5547 Py_CLEAR(self->arg);
5548 Py_CLEAR(self->last_string);
5549 Py_CLEAR(self->find_class);
5550 return 0;
5553 static PyObject *
5554 Unpickler_getattr(Unpicklerobject *self, char *name)
5556 if (!strcmp(name, "persistent_load")) {
5557 if (!self->pers_func) {
5558 PyErr_SetString(PyExc_AttributeError, name);
5559 return NULL;
5562 Py_INCREF(self->pers_func);
5563 return self->pers_func;
5566 if (!strcmp(name, "find_global")) {
5567 if (!self->find_class) {
5568 PyErr_SetString(PyExc_AttributeError, name);
5569 return NULL;
5572 Py_INCREF(self->find_class);
5573 return self->find_class;
5576 if (!strcmp(name, "memo")) {
5577 if (!self->memo) {
5578 PyErr_SetString(PyExc_AttributeError, name);
5579 return NULL;
5582 Py_INCREF(self->memo);
5583 return self->memo;
5586 if (!strcmp(name, "UnpicklingError")) {
5587 Py_INCREF(UnpicklingError);
5588 return UnpicklingError;
5591 return Py_FindMethod(Unpickler_methods, (PyObject *)self, name);
5595 static int
5596 Unpickler_setattr(Unpicklerobject *self, char *name, PyObject *value)
5599 if (!strcmp(name, "persistent_load")) {
5600 Py_XDECREF(self->pers_func);
5601 self->pers_func = value;
5602 Py_XINCREF(value);
5603 return 0;
5606 if (!strcmp(name, "find_global")) {
5607 Py_XDECREF(self->find_class);
5608 self->find_class = value;
5609 Py_XINCREF(value);
5610 return 0;
5613 if (! value) {
5614 PyErr_SetString(PyExc_TypeError,
5615 "attribute deletion is not supported");
5616 return -1;
5619 if (strcmp(name, "memo") == 0) {
5620 if (!PyDict_Check(value)) {
5621 PyErr_SetString(PyExc_TypeError,
5622 "memo must be a dictionary");
5623 return -1;
5625 Py_XDECREF(self->memo);
5626 self->memo = value;
5627 Py_INCREF(value);
5628 return 0;
5631 PyErr_SetString(PyExc_AttributeError, name);
5632 return -1;
5635 /* ---------------------------------------------------------------------------
5636 * Module-level functions.
5639 /* dump(obj, file, protocol=0). */
5640 static PyObject *
5641 cpm_dump(PyObject *self, PyObject *args, PyObject *kwds)
5643 static char *kwlist[] = {"obj", "file", "protocol", NULL};
5644 PyObject *ob, *file, *res = NULL;
5645 Picklerobject *pickler = 0;
5646 int proto = 0;
5648 if (!( PyArg_ParseTupleAndKeywords(args, kwds, "OO|i", kwlist,
5649 &ob, &file, &proto)))
5650 goto finally;
5652 if (!( pickler = newPicklerobject(file, proto)))
5653 goto finally;
5655 if (dump(pickler, ob) < 0)
5656 goto finally;
5658 Py_INCREF(Py_None);
5659 res = Py_None;
5661 finally:
5662 Py_XDECREF(pickler);
5664 return res;
5668 /* dumps(obj, protocol=0). */
5669 static PyObject *
5670 cpm_dumps(PyObject *self, PyObject *args, PyObject *kwds)
5672 static char *kwlist[] = {"obj", "protocol", NULL};
5673 PyObject *ob, *file = 0, *res = NULL;
5674 Picklerobject *pickler = 0;
5675 int proto = 0;
5677 if (!( PyArg_ParseTupleAndKeywords(args, kwds, "O|i:dumps", kwlist,
5678 &ob, &proto)))
5679 goto finally;
5681 if (!( file = PycStringIO->NewOutput(128)))
5682 goto finally;
5684 if (!( pickler = newPicklerobject(file, proto)))
5685 goto finally;
5687 if (dump(pickler, ob) < 0)
5688 goto finally;
5690 res = PycStringIO->cgetvalue(file);
5692 finally:
5693 Py_XDECREF(pickler);
5694 Py_XDECREF(file);
5696 return res;
5700 /* load(fileobj). */
5701 static PyObject *
5702 cpm_load(PyObject *self, PyObject *ob)
5704 Unpicklerobject *unpickler = 0;
5705 PyObject *res = NULL;
5707 if (!( unpickler = newUnpicklerobject(ob)))
5708 goto finally;
5710 res = load(unpickler);
5712 finally:
5713 Py_XDECREF(unpickler);
5715 return res;
5719 /* loads(string) */
5720 static PyObject *
5721 cpm_loads(PyObject *self, PyObject *args)
5723 PyObject *ob, *file = 0, *res = NULL;
5724 Unpicklerobject *unpickler = 0;
5726 if (!( PyArg_ParseTuple(args, "S:loads", &ob)))
5727 goto finally;
5729 if (!( file = PycStringIO->NewInput(ob)))
5730 goto finally;
5732 if (!( unpickler = newUnpicklerobject(file)))
5733 goto finally;
5735 res = load(unpickler);
5737 finally:
5738 Py_XDECREF(file);
5739 Py_XDECREF(unpickler);
5741 return res;
5745 PyDoc_STRVAR(Unpicklertype__doc__,
5746 "Objects that know how to unpickle");
5748 static PyTypeObject Unpicklertype = {
5749 PyVarObject_HEAD_INIT(NULL, 0)
5750 "cPickle.Unpickler", /*tp_name*/
5751 sizeof(Unpicklerobject), /*tp_basicsize*/
5753 (destructor)Unpickler_dealloc, /* tp_dealloc */
5754 0, /* tp_print */
5755 (getattrfunc)Unpickler_getattr, /* tp_getattr */
5756 (setattrfunc)Unpickler_setattr, /* tp_setattr */
5757 0, /* tp_compare */
5758 0, /* tp_repr */
5759 0, /* tp_as_number */
5760 0, /* tp_as_sequence */
5761 0, /* tp_as_mapping */
5762 0, /* tp_hash */
5763 0, /* tp_call */
5764 0, /* tp_str */
5765 0, /* tp_getattro */
5766 0, /* tp_setattro */
5767 0, /* tp_as_buffer */
5768 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE | Py_TPFLAGS_HAVE_GC,
5769 Unpicklertype__doc__, /* tp_doc */
5770 (traverseproc)Unpickler_traverse, /* tp_traverse */
5771 (inquiry)Unpickler_clear, /* tp_clear */
5774 static struct PyMethodDef cPickle_methods[] = {
5775 {"dump", (PyCFunction)cpm_dump, METH_VARARGS | METH_KEYWORDS,
5776 PyDoc_STR("dump(obj, file, protocol=0) -- "
5777 "Write an object in pickle format to the given file.\n"
5778 "\n"
5779 "See the Pickler docstring for the meaning of optional argument proto.")
5782 {"dumps", (PyCFunction)cpm_dumps, METH_VARARGS | METH_KEYWORDS,
5783 PyDoc_STR("dumps(obj, protocol=0) -- "
5784 "Return a string containing an object in pickle format.\n"
5785 "\n"
5786 "See the Pickler docstring for the meaning of optional argument proto.")
5789 {"load", (PyCFunction)cpm_load, METH_O,
5790 PyDoc_STR("load(file) -- Load a pickle from the given file")},
5792 {"loads", (PyCFunction)cpm_loads, METH_VARARGS,
5793 PyDoc_STR("loads(string) -- Load a pickle from the given string")},
5795 {"Pickler", (PyCFunction)get_Pickler, METH_VARARGS | METH_KEYWORDS,
5796 PyDoc_STR("Pickler(file, protocol=0) -- Create a pickler.\n"
5797 "\n"
5798 "This takes a file-like object for writing a pickle data stream.\n"
5799 "The optional proto argument tells the pickler to use the given\n"
5800 "protocol; supported protocols are 0, 1, 2. The default\n"
5801 "protocol is 0, to be backwards compatible. (Protocol 0 is the\n"
5802 "only protocol that can be written to a file opened in text\n"
5803 "mode and read back successfully. When using a protocol higher\n"
5804 "than 0, make sure the file is opened in binary mode, both when\n"
5805 "pickling and unpickling.)\n"
5806 "\n"
5807 "Protocol 1 is more efficient than protocol 0; protocol 2 is\n"
5808 "more efficient than protocol 1.\n"
5809 "\n"
5810 "Specifying a negative protocol version selects the highest\n"
5811 "protocol version supported. The higher the protocol used, the\n"
5812 "more recent the version of Python needed to read the pickle\n"
5813 "produced.\n"
5814 "\n"
5815 "The file parameter must have a write() method that accepts a single\n"
5816 "string argument. It can thus be an open file object, a StringIO\n"
5817 "object, or any other custom object that meets this interface.\n")
5820 {"Unpickler", (PyCFunction)get_Unpickler, METH_O,
5821 PyDoc_STR("Unpickler(file) -- Create an unpickler.")},
5823 { NULL, NULL }
5826 static int
5827 init_stuff(PyObject *module_dict)
5829 PyObject *copyreg, *t, *r;
5831 #define INIT_STR(S) if (!( S ## _str=PyString_InternFromString(#S))) return -1;
5833 if (PyType_Ready(&Unpicklertype) < 0)
5834 return -1;
5835 if (PyType_Ready(&Picklertype) < 0)
5836 return -1;
5838 INIT_STR(__class__);
5839 INIT_STR(__getinitargs__);
5840 INIT_STR(__dict__);
5841 INIT_STR(__getstate__);
5842 INIT_STR(__setstate__);
5843 INIT_STR(__name__);
5844 INIT_STR(__main__);
5845 INIT_STR(__reduce__);
5846 INIT_STR(__reduce_ex__);
5847 INIT_STR(write);
5848 INIT_STR(append);
5849 INIT_STR(read);
5850 INIT_STR(readline);
5851 INIT_STR(dispatch_table);
5853 if (!( copyreg = PyImport_ImportModule("copy_reg")))
5854 return -1;
5856 /* This is special because we want to use a different
5857 one in restricted mode. */
5858 dispatch_table = PyObject_GetAttr(copyreg, dispatch_table_str);
5859 if (!dispatch_table) return -1;
5861 extension_registry = PyObject_GetAttrString(copyreg,
5862 "_extension_registry");
5863 if (!extension_registry) return -1;
5865 inverted_registry = PyObject_GetAttrString(copyreg,
5866 "_inverted_registry");
5867 if (!inverted_registry) return -1;
5869 extension_cache = PyObject_GetAttrString(copyreg,
5870 "_extension_cache");
5871 if (!extension_cache) return -1;
5873 Py_DECREF(copyreg);
5875 if (!(empty_tuple = PyTuple_New(0)))
5876 return -1;
5878 two_tuple = PyTuple_New(2);
5879 if (two_tuple == NULL)
5880 return -1;
5881 /* We use this temp container with no regard to refcounts, or to
5882 * keeping containees alive. Exempt from GC, because we don't
5883 * want anything looking at two_tuple() by magic.
5885 PyObject_GC_UnTrack(two_tuple);
5887 /* Ugh */
5888 if (!( t=PyImport_ImportModule("__builtin__"))) return -1;
5889 if (PyDict_SetItemString(module_dict, "__builtins__", t) < 0)
5890 return -1;
5892 if (!( t=PyDict_New())) return -1;
5893 if (!( r=PyRun_String(
5894 "def __str__(self):\n"
5895 " return self.args and ('%s' % self.args[0]) or '(what)'\n",
5896 Py_file_input,
5897 module_dict, t) )) return -1;
5898 Py_DECREF(r);
5900 PickleError = PyErr_NewException("cPickle.PickleError", NULL, t);
5901 if (!PickleError)
5902 return -1;
5904 Py_DECREF(t);
5906 PicklingError = PyErr_NewException("cPickle.PicklingError",
5907 PickleError, NULL);
5908 if (!PicklingError)
5909 return -1;
5911 if (!( t=PyDict_New())) return -1;
5912 if (!( r=PyRun_String(
5913 "def __str__(self):\n"
5914 " a=self.args\n"
5915 " a=a and type(a[0]) or '(what)'\n"
5916 " return 'Cannot pickle %s objects' % a\n"
5917 , Py_file_input,
5918 module_dict, t) )) return -1;
5919 Py_DECREF(r);
5921 if (!( UnpickleableError = PyErr_NewException(
5922 "cPickle.UnpickleableError", PicklingError, t)))
5923 return -1;
5925 Py_DECREF(t);
5927 if (!( UnpicklingError = PyErr_NewException("cPickle.UnpicklingError",
5928 PickleError, NULL)))
5929 return -1;
5931 if (!( BadPickleGet = PyErr_NewException("cPickle.BadPickleGet",
5932 UnpicklingError, NULL)))
5933 return -1;
5935 if (PyDict_SetItemString(module_dict, "PickleError",
5936 PickleError) < 0)
5937 return -1;
5939 if (PyDict_SetItemString(module_dict, "PicklingError",
5940 PicklingError) < 0)
5941 return -1;
5943 if (PyDict_SetItemString(module_dict, "UnpicklingError",
5944 UnpicklingError) < 0)
5945 return -1;
5947 if (PyDict_SetItemString(module_dict, "UnpickleableError",
5948 UnpickleableError) < 0)
5949 return -1;
5951 if (PyDict_SetItemString(module_dict, "BadPickleGet",
5952 BadPickleGet) < 0)
5953 return -1;
5955 PycString_IMPORT;
5957 return 0;
5960 #ifndef PyMODINIT_FUNC /* declarations for DLL import/export */
5961 #define PyMODINIT_FUNC void
5962 #endif
5963 PyMODINIT_FUNC
5964 initcPickle(void)
5966 PyObject *m, *d, *di, *v, *k;
5967 Py_ssize_t i;
5968 char *rev = "1.71"; /* XXX when does this change? */
5969 PyObject *format_version;
5970 PyObject *compatible_formats;
5972 Py_TYPE(&Picklertype) = &PyType_Type;
5973 Py_TYPE(&Unpicklertype) = &PyType_Type;
5974 Py_TYPE(&PdataType) = &PyType_Type;
5976 /* Initialize some pieces. We need to do this before module creation,
5977 * so we're forced to use a temporary dictionary. :(
5979 di = PyDict_New();
5980 if (!di) return;
5981 if (init_stuff(di) < 0) return;
5983 /* Create the module and add the functions */
5984 m = Py_InitModule4("cPickle", cPickle_methods,
5985 cPickle_module_documentation,
5986 (PyObject*)NULL,PYTHON_API_VERSION);
5987 if (m == NULL)
5988 return;
5990 /* Add some symbolic constants to the module */
5991 d = PyModule_GetDict(m);
5992 v = PyString_FromString(rev);
5993 PyDict_SetItemString(d, "__version__", v);
5994 Py_XDECREF(v);
5996 /* Copy data from di. Waaa. */
5997 for (i=0; PyDict_Next(di, &i, &k, &v); ) {
5998 if (PyObject_SetItem(d, k, v) < 0) {
5999 Py_DECREF(di);
6000 return;
6003 Py_DECREF(di);
6005 i = PyModule_AddIntConstant(m, "HIGHEST_PROTOCOL", HIGHEST_PROTOCOL);
6006 if (i < 0)
6007 return;
6009 /* These are purely informational; no code uses them. */
6010 /* File format version we write. */
6011 format_version = PyString_FromString("2.0");
6012 /* Format versions we can read. */
6013 compatible_formats = Py_BuildValue("[sssss]",
6014 "1.0", /* Original protocol 0 */
6015 "1.1", /* Protocol 0 + INST */
6016 "1.2", /* Original protocol 1 */
6017 "1.3", /* Protocol 1 + BINFLOAT */
6018 "2.0"); /* Original protocol 2 */
6019 PyDict_SetItemString(d, "format_version", format_version);
6020 PyDict_SetItemString(d, "compatible_formats", compatible_formats);
6021 Py_XDECREF(format_version);
6022 Py_XDECREF(compatible_formats);