1 /* struct module -- pack values into and (out of) bytes objects */
2
3 /* New version supporting byte order, alignment and size options,
4 character strings, and unsigned numbers */
5
6 #define PY_SSIZE_T_CLEAN
7
8 #include "Python.h"
9 #include "structmember.h"
10 #include <ctype.h>
11
12 /*[clinic input]
13 class Struct "PyStructObject *" "&PyStructType"
14 [clinic start generated code]*/
15 /*[clinic end generated code: output=da39a3ee5e6b4b0d input=9b032058a83ed7c3]*/
16
17 static PyTypeObject PyStructType;
18
19 /* The translation function for each format character is table driven */
20 typedef struct _formatdef {
21 char format;
22 Py_ssize_t size;
23 Py_ssize_t alignment;
24 PyObject* (*unpack)(const char *,
25 const struct _formatdef *);
26 int (*pack)(char *, PyObject *,
27 const struct _formatdef *);
28 } formatdef;
29
30 typedef struct _formatcode {
31 const struct _formatdef *fmtdef;
32 Py_ssize_t offset;
33 Py_ssize_t size;
34 Py_ssize_t repeat;
35 } formatcode;
36
37 /* Struct object interface */
38
39 typedef struct {
40 PyObject_HEAD
41 Py_ssize_t s_size;
42 Py_ssize_t s_len;
43 formatcode *s_codes;
44 PyObject *s_format;
45 PyObject *weakreflist; /* List of weak references */
46 } PyStructObject;
47
48
49 #define PyStruct_Check(op) PyObject_TypeCheck(op, &PyStructType)
50 #define PyStruct_CheckExact(op) (Py_TYPE(op) == &PyStructType)
51
52
53 /* Exception */
54
55 static PyObject *StructError;
56
57
58 /* Define various structs to figure out the alignments of types */
59
60
61 typedef struct { char c; short x; } st_short;
62 typedef struct { char c; int x; } st_int;
63 typedef struct { char c; long x; } st_long;
64 typedef struct { char c; float x; } st_float;
65 typedef struct { char c; double x; } st_double;
66 typedef struct { char c; void *x; } st_void_p;
67 typedef struct { char c; size_t x; } st_size_t;
68 typedef struct { char c; _Bool x; } st_bool;
69
70 #define SHORT_ALIGN (sizeof(st_short) - sizeof(short))
71 #define INT_ALIGN (sizeof(st_int) - sizeof(int))
72 #define LONG_ALIGN (sizeof(st_long) - sizeof(long))
73 #define FLOAT_ALIGN (sizeof(st_float) - sizeof(float))
74 #define DOUBLE_ALIGN (sizeof(st_double) - sizeof(double))
75 #define VOID_P_ALIGN (sizeof(st_void_p) - sizeof(void *))
76 #define SIZE_T_ALIGN (sizeof(st_size_t) - sizeof(size_t))
77 #define BOOL_ALIGN (sizeof(st_bool) - sizeof(_Bool))
78
79 /* We can't support q and Q in native mode unless the compiler does;
80 in std mode, they're 8 bytes on all platforms. */
81 typedef struct { char c; long long x; } s_long_long;
82 #define LONG_LONG_ALIGN (sizeof(s_long_long) - sizeof(long long))
83
84 #ifdef __powerc
85 #pragma options align=reset
86 #endif
87
88 /*[python input]
89 class cache_struct_converter(CConverter):
90 type = 'PyStructObject *'
91 converter = 'cache_struct_converter'
92 c_default = "NULL"
93
94 def cleanup(self):
95 return "Py_XDECREF(%s);\n" % self.name
96 [python start generated code]*/
97 /*[python end generated code: output=da39a3ee5e6b4b0d input=49957cca130ffb63]*/
98
99 static int cache_struct_converter(PyObject *, PyStructObject **);
100
101 #include "clinic/_struct.c.h"
102
103 /* Helper for integer format codes: converts an arbitrary Python object to a
104 PyLongObject if possible, otherwise fails. Caller should decref. */
105
106 static PyObject *
get_pylong(PyObject * v)107 get_pylong(PyObject *v)
108 {
109 assert(v != NULL);
110 if (!PyLong_Check(v)) {
111 /* Not an integer; try to use __index__ to convert. */
112 if (PyIndex_Check(v)) {
113 v = PyNumber_Index(v);
114 if (v == NULL)
115 return NULL;
116 }
117 else {
118 PyErr_SetString(StructError,
119 "required argument is not an integer");
120 return NULL;
121 }
122 }
123 else
124 Py_INCREF(v);
125
126 assert(PyLong_Check(v));
127 return v;
128 }
129
130 /* Helper routine to get a C long and raise the appropriate error if it isn't
131 one */
132
133 static int
get_long(PyObject * v,long * p)134 get_long(PyObject *v, long *p)
135 {
136 long x;
137
138 v = get_pylong(v);
139 if (v == NULL)
140 return -1;
141 assert(PyLong_Check(v));
142 x = PyLong_AsLong(v);
143 Py_DECREF(v);
144 if (x == (long)-1 && PyErr_Occurred()) {
145 if (PyErr_ExceptionMatches(PyExc_OverflowError))
146 PyErr_SetString(StructError,
147 "argument out of range");
148 return -1;
149 }
150 *p = x;
151 return 0;
152 }
153
154
155 /* Same, but handling unsigned long */
156
157 static int
get_ulong(PyObject * v,unsigned long * p)158 get_ulong(PyObject *v, unsigned long *p)
159 {
160 unsigned long x;
161
162 v = get_pylong(v);
163 if (v == NULL)
164 return -1;
165 assert(PyLong_Check(v));
166 x = PyLong_AsUnsignedLong(v);
167 Py_DECREF(v);
168 if (x == (unsigned long)-1 && PyErr_Occurred()) {
169 if (PyErr_ExceptionMatches(PyExc_OverflowError))
170 PyErr_SetString(StructError,
171 "argument out of range");
172 return -1;
173 }
174 *p = x;
175 return 0;
176 }
177
178 /* Same, but handling native long long. */
179
180 static int
get_longlong(PyObject * v,long long * p)181 get_longlong(PyObject *v, long long *p)
182 {
183 long long x;
184
185 v = get_pylong(v);
186 if (v == NULL)
187 return -1;
188 assert(PyLong_Check(v));
189 x = PyLong_AsLongLong(v);
190 Py_DECREF(v);
191 if (x == (long long)-1 && PyErr_Occurred()) {
192 if (PyErr_ExceptionMatches(PyExc_OverflowError))
193 PyErr_SetString(StructError,
194 "argument out of range");
195 return -1;
196 }
197 *p = x;
198 return 0;
199 }
200
201 /* Same, but handling native unsigned long long. */
202
203 static int
get_ulonglong(PyObject * v,unsigned long long * p)204 get_ulonglong(PyObject *v, unsigned long long *p)
205 {
206 unsigned long long x;
207
208 v = get_pylong(v);
209 if (v == NULL)
210 return -1;
211 assert(PyLong_Check(v));
212 x = PyLong_AsUnsignedLongLong(v);
213 Py_DECREF(v);
214 if (x == (unsigned long long)-1 && PyErr_Occurred()) {
215 if (PyErr_ExceptionMatches(PyExc_OverflowError))
216 PyErr_SetString(StructError,
217 "argument out of range");
218 return -1;
219 }
220 *p = x;
221 return 0;
222 }
223
224 /* Same, but handling Py_ssize_t */
225
226 static int
get_ssize_t(PyObject * v,Py_ssize_t * p)227 get_ssize_t(PyObject *v, Py_ssize_t *p)
228 {
229 Py_ssize_t x;
230
231 v = get_pylong(v);
232 if (v == NULL)
233 return -1;
234 assert(PyLong_Check(v));
235 x = PyLong_AsSsize_t(v);
236 Py_DECREF(v);
237 if (x == (Py_ssize_t)-1 && PyErr_Occurred()) {
238 if (PyErr_ExceptionMatches(PyExc_OverflowError))
239 PyErr_SetString(StructError,
240 "argument out of range");
241 return -1;
242 }
243 *p = x;
244 return 0;
245 }
246
247 /* Same, but handling size_t */
248
249 static int
get_size_t(PyObject * v,size_t * p)250 get_size_t(PyObject *v, size_t *p)
251 {
252 size_t x;
253
254 v = get_pylong(v);
255 if (v == NULL)
256 return -1;
257 assert(PyLong_Check(v));
258 x = PyLong_AsSize_t(v);
259 Py_DECREF(v);
260 if (x == (size_t)-1 && PyErr_Occurred()) {
261 if (PyErr_ExceptionMatches(PyExc_OverflowError))
262 PyErr_SetString(StructError,
263 "argument out of range");
264 return -1;
265 }
266 *p = x;
267 return 0;
268 }
269
270
271 #define RANGE_ERROR(x, f, flag, mask) return _range_error(f, flag)
272
273
274 /* Floating point helpers */
275
276 static PyObject *
unpack_halffloat(const char * p,int le)277 unpack_halffloat(const char *p, /* start of 2-byte string */
278 int le) /* true for little-endian, false for big-endian */
279 {
280 double x;
281
282 x = _PyFloat_Unpack2((unsigned char *)p, le);
283 if (x == -1.0 && PyErr_Occurred()) {
284 return NULL;
285 }
286 return PyFloat_FromDouble(x);
287 }
288
289 static int
pack_halffloat(char * p,PyObject * v,int le)290 pack_halffloat(char *p, /* start of 2-byte string */
291 PyObject *v, /* value to pack */
292 int le) /* true for little-endian, false for big-endian */
293 {
294 double x = PyFloat_AsDouble(v);
295 if (x == -1.0 && PyErr_Occurred()) {
296 PyErr_SetString(StructError,
297 "required argument is not a float");
298 return -1;
299 }
300 return _PyFloat_Pack2(x, (unsigned char *)p, le);
301 }
302
303 static PyObject *
unpack_float(const char * p,int le)304 unpack_float(const char *p, /* start of 4-byte string */
305 int le) /* true for little-endian, false for big-endian */
306 {
307 double x;
308
309 x = _PyFloat_Unpack4((unsigned char *)p, le);
310 if (x == -1.0 && PyErr_Occurred())
311 return NULL;
312 return PyFloat_FromDouble(x);
313 }
314
315 static PyObject *
unpack_double(const char * p,int le)316 unpack_double(const char *p, /* start of 8-byte string */
317 int le) /* true for little-endian, false for big-endian */
318 {
319 double x;
320
321 x = _PyFloat_Unpack8((unsigned char *)p, le);
322 if (x == -1.0 && PyErr_Occurred())
323 return NULL;
324 return PyFloat_FromDouble(x);
325 }
326
327 /* Helper to format the range error exceptions */
328 static int
_range_error(const formatdef * f,int is_unsigned)329 _range_error(const formatdef *f, int is_unsigned)
330 {
331 /* ulargest is the largest unsigned value with f->size bytes.
332 * Note that the simpler:
333 * ((size_t)1 << (f->size * 8)) - 1
334 * doesn't work when f->size == sizeof(size_t) because C doesn't
335 * define what happens when a left shift count is >= the number of
336 * bits in the integer being shifted; e.g., on some boxes it doesn't
337 * shift at all when they're equal.
338 */
339 const size_t ulargest = (size_t)-1 >> ((SIZEOF_SIZE_T - f->size)*8);
340 assert(f->size >= 1 && f->size <= SIZEOF_SIZE_T);
341 if (is_unsigned)
342 PyErr_Format(StructError,
343 "'%c' format requires 0 <= number <= %zu",
344 f->format,
345 ulargest);
346 else {
347 const Py_ssize_t largest = (Py_ssize_t)(ulargest >> 1);
348 PyErr_Format(StructError,
349 "'%c' format requires %zd <= number <= %zd",
350 f->format,
351 ~ largest,
352 largest);
353 }
354
355 return -1;
356 }
357
358
359
360 /* A large number of small routines follow, with names of the form
361
362 [bln][up]_TYPE
363
364 [bln] distiguishes among big-endian, little-endian and native.
365 [pu] distiguishes between pack (to struct) and unpack (from struct).
366 TYPE is one of char, byte, ubyte, etc.
367 */
368
369 /* Native mode routines. ****************************************************/
370 /* NOTE:
371 In all n[up]_<type> routines handling types larger than 1 byte, there is
372 *no* guarantee that the p pointer is properly aligned for each type,
373 therefore memcpy is called. An intermediate variable is used to
374 compensate for big-endian architectures.
375 Normally both the intermediate variable and the memcpy call will be
376 skipped by C optimisation in little-endian architectures (gcc >= 2.91
377 does this). */
378
379 static PyObject *
nu_char(const char * p,const formatdef * f)380 nu_char(const char *p, const formatdef *f)
381 {
382 return PyBytes_FromStringAndSize(p, 1);
383 }
384
385 static PyObject *
nu_byte(const char * p,const formatdef * f)386 nu_byte(const char *p, const formatdef *f)
387 {
388 return PyLong_FromLong((long) *(signed char *)p);
389 }
390
391 static PyObject *
nu_ubyte(const char * p,const formatdef * f)392 nu_ubyte(const char *p, const formatdef *f)
393 {
394 return PyLong_FromLong((long) *(unsigned char *)p);
395 }
396
397 static PyObject *
nu_short(const char * p,const formatdef * f)398 nu_short(const char *p, const formatdef *f)
399 {
400 short x;
401 memcpy((char *)&x, p, sizeof x);
402 return PyLong_FromLong((long)x);
403 }
404
405 static PyObject *
nu_ushort(const char * p,const formatdef * f)406 nu_ushort(const char *p, const formatdef *f)
407 {
408 unsigned short x;
409 memcpy((char *)&x, p, sizeof x);
410 return PyLong_FromLong((long)x);
411 }
412
413 static PyObject *
nu_int(const char * p,const formatdef * f)414 nu_int(const char *p, const formatdef *f)
415 {
416 int x;
417 memcpy((char *)&x, p, sizeof x);
418 return PyLong_FromLong((long)x);
419 }
420
421 static PyObject *
nu_uint(const char * p,const formatdef * f)422 nu_uint(const char *p, const formatdef *f)
423 {
424 unsigned int x;
425 memcpy((char *)&x, p, sizeof x);
426 return PyLong_FromUnsignedLong((unsigned long)x);
427 }
428
429 static PyObject *
nu_long(const char * p,const formatdef * f)430 nu_long(const char *p, const formatdef *f)
431 {
432 long x;
433 memcpy((char *)&x, p, sizeof x);
434 return PyLong_FromLong(x);
435 }
436
437 static PyObject *
nu_ulong(const char * p,const formatdef * f)438 nu_ulong(const char *p, const formatdef *f)
439 {
440 unsigned long x;
441 memcpy((char *)&x, p, sizeof x);
442 return PyLong_FromUnsignedLong(x);
443 }
444
445 static PyObject *
nu_ssize_t(const char * p,const formatdef * f)446 nu_ssize_t(const char *p, const formatdef *f)
447 {
448 Py_ssize_t x;
449 memcpy((char *)&x, p, sizeof x);
450 return PyLong_FromSsize_t(x);
451 }
452
453 static PyObject *
nu_size_t(const char * p,const formatdef * f)454 nu_size_t(const char *p, const formatdef *f)
455 {
456 size_t x;
457 memcpy((char *)&x, p, sizeof x);
458 return PyLong_FromSize_t(x);
459 }
460
461 static PyObject *
nu_longlong(const char * p,const formatdef * f)462 nu_longlong(const char *p, const formatdef *f)
463 {
464 long long x;
465 memcpy((char *)&x, p, sizeof x);
466 return PyLong_FromLongLong(x);
467 }
468
469 static PyObject *
nu_ulonglong(const char * p,const formatdef * f)470 nu_ulonglong(const char *p, const formatdef *f)
471 {
472 unsigned long long x;
473 memcpy((char *)&x, p, sizeof x);
474 return PyLong_FromUnsignedLongLong(x);
475 }
476
477 static PyObject *
nu_bool(const char * p,const formatdef * f)478 nu_bool(const char *p, const formatdef *f)
479 {
480 _Bool x;
481 memcpy((char *)&x, p, sizeof x);
482 return PyBool_FromLong(x != 0);
483 }
484
485
486 static PyObject *
nu_halffloat(const char * p,const formatdef * f)487 nu_halffloat(const char *p, const formatdef *f)
488 {
489 #if PY_LITTLE_ENDIAN
490 return unpack_halffloat(p, 1);
491 #else
492 return unpack_halffloat(p, 0);
493 #endif
494 }
495
496 static PyObject *
nu_float(const char * p,const formatdef * f)497 nu_float(const char *p, const formatdef *f)
498 {
499 float x;
500 memcpy((char *)&x, p, sizeof x);
501 return PyFloat_FromDouble((double)x);
502 }
503
504 static PyObject *
nu_double(const char * p,const formatdef * f)505 nu_double(const char *p, const formatdef *f)
506 {
507 double x;
508 memcpy((char *)&x, p, sizeof x);
509 return PyFloat_FromDouble(x);
510 }
511
512 static PyObject *
nu_void_p(const char * p,const formatdef * f)513 nu_void_p(const char *p, const formatdef *f)
514 {
515 void *x;
516 memcpy((char *)&x, p, sizeof x);
517 return PyLong_FromVoidPtr(x);
518 }
519
520 static int
np_byte(char * p,PyObject * v,const formatdef * f)521 np_byte(char *p, PyObject *v, const formatdef *f)
522 {
523 long x;
524 if (get_long(v, &x) < 0)
525 return -1;
526 if (x < -128 || x > 127) {
527 PyErr_SetString(StructError,
528 "byte format requires -128 <= number <= 127");
529 return -1;
530 }
531 *p = (char)x;
532 return 0;
533 }
534
535 static int
np_ubyte(char * p,PyObject * v,const formatdef * f)536 np_ubyte(char *p, PyObject *v, const formatdef *f)
537 {
538 long x;
539 if (get_long(v, &x) < 0)
540 return -1;
541 if (x < 0 || x > 255) {
542 PyErr_SetString(StructError,
543 "ubyte format requires 0 <= number <= 255");
544 return -1;
545 }
546 *(unsigned char *)p = (unsigned char)x;
547 return 0;
548 }
549
550 static int
np_char(char * p,PyObject * v,const formatdef * f)551 np_char(char *p, PyObject *v, const formatdef *f)
552 {
553 if (!PyBytes_Check(v) || PyBytes_GET_SIZE(v) != 1) {
554 PyErr_SetString(StructError,
555 "char format requires a bytes object of length 1");
556 return -1;
557 }
558 *p = *PyBytes_AS_STRING(v);
559 return 0;
560 }
561
562 static int
np_short(char * p,PyObject * v,const formatdef * f)563 np_short(char *p, PyObject *v, const formatdef *f)
564 {
565 long x;
566 short y;
567 if (get_long(v, &x) < 0)
568 return -1;
569 if (x < SHRT_MIN || x > SHRT_MAX) {
570 PyErr_SetString(StructError,
571 "short format requires " Py_STRINGIFY(SHRT_MIN)
572 " <= number <= " Py_STRINGIFY(SHRT_MAX));
573 return -1;
574 }
575 y = (short)x;
576 memcpy(p, (char *)&y, sizeof y);
577 return 0;
578 }
579
580 static int
np_ushort(char * p,PyObject * v,const formatdef * f)581 np_ushort(char *p, PyObject *v, const formatdef *f)
582 {
583 long x;
584 unsigned short y;
585 if (get_long(v, &x) < 0)
586 return -1;
587 if (x < 0 || x > USHRT_MAX) {
588 PyErr_SetString(StructError,
589 "ushort format requires 0 <= number <= "
590 Py_STRINGIFY(USHRT_MAX));
591 return -1;
592 }
593 y = (unsigned short)x;
594 memcpy(p, (char *)&y, sizeof y);
595 return 0;
596 }
597
598 static int
np_int(char * p,PyObject * v,const formatdef * f)599 np_int(char *p, PyObject *v, const formatdef *f)
600 {
601 long x;
602 int y;
603 if (get_long(v, &x) < 0)
604 return -1;
605 #if (SIZEOF_LONG > SIZEOF_INT)
606 if ((x < ((long)INT_MIN)) || (x > ((long)INT_MAX)))
607 RANGE_ERROR(x, f, 0, -1);
608 #endif
609 y = (int)x;
610 memcpy(p, (char *)&y, sizeof y);
611 return 0;
612 }
613
614 static int
np_uint(char * p,PyObject * v,const formatdef * f)615 np_uint(char *p, PyObject *v, const formatdef *f)
616 {
617 unsigned long x;
618 unsigned int y;
619 if (get_ulong(v, &x) < 0)
620 return -1;
621 y = (unsigned int)x;
622 #if (SIZEOF_LONG > SIZEOF_INT)
623 if (x > ((unsigned long)UINT_MAX))
624 RANGE_ERROR(y, f, 1, -1);
625 #endif
626 memcpy(p, (char *)&y, sizeof y);
627 return 0;
628 }
629
630 static int
np_long(char * p,PyObject * v,const formatdef * f)631 np_long(char *p, PyObject *v, const formatdef *f)
632 {
633 long x;
634 if (get_long(v, &x) < 0)
635 return -1;
636 memcpy(p, (char *)&x, sizeof x);
637 return 0;
638 }
639
640 static int
np_ulong(char * p,PyObject * v,const formatdef * f)641 np_ulong(char *p, PyObject *v, const formatdef *f)
642 {
643 unsigned long x;
644 if (get_ulong(v, &x) < 0)
645 return -1;
646 memcpy(p, (char *)&x, sizeof x);
647 return 0;
648 }
649
650 static int
np_ssize_t(char * p,PyObject * v,const formatdef * f)651 np_ssize_t(char *p, PyObject *v, const formatdef *f)
652 {
653 Py_ssize_t x;
654 if (get_ssize_t(v, &x) < 0)
655 return -1;
656 memcpy(p, (char *)&x, sizeof x);
657 return 0;
658 }
659
660 static int
np_size_t(char * p,PyObject * v,const formatdef * f)661 np_size_t(char *p, PyObject *v, const formatdef *f)
662 {
663 size_t x;
664 if (get_size_t(v, &x) < 0)
665 return -1;
666 memcpy(p, (char *)&x, sizeof x);
667 return 0;
668 }
669
670 static int
np_longlong(char * p,PyObject * v,const formatdef * f)671 np_longlong(char *p, PyObject *v, const formatdef *f)
672 {
673 long long x;
674 if (get_longlong(v, &x) < 0)
675 return -1;
676 memcpy(p, (char *)&x, sizeof x);
677 return 0;
678 }
679
680 static int
np_ulonglong(char * p,PyObject * v,const formatdef * f)681 np_ulonglong(char *p, PyObject *v, const formatdef *f)
682 {
683 unsigned long long x;
684 if (get_ulonglong(v, &x) < 0)
685 return -1;
686 memcpy(p, (char *)&x, sizeof x);
687 return 0;
688 }
689
690
691 static int
np_bool(char * p,PyObject * v,const formatdef * f)692 np_bool(char *p, PyObject *v, const formatdef *f)
693 {
694 int y;
695 _Bool x;
696 y = PyObject_IsTrue(v);
697 if (y < 0)
698 return -1;
699 x = y;
700 memcpy(p, (char *)&x, sizeof x);
701 return 0;
702 }
703
704 static int
np_halffloat(char * p,PyObject * v,const formatdef * f)705 np_halffloat(char *p, PyObject *v, const formatdef *f)
706 {
707 #if PY_LITTLE_ENDIAN
708 return pack_halffloat(p, v, 1);
709 #else
710 return pack_halffloat(p, v, 0);
711 #endif
712 }
713
714 static int
np_float(char * p,PyObject * v,const formatdef * f)715 np_float(char *p, PyObject *v, const formatdef *f)
716 {
717 float x = (float)PyFloat_AsDouble(v);
718 if (x == -1 && PyErr_Occurred()) {
719 PyErr_SetString(StructError,
720 "required argument is not a float");
721 return -1;
722 }
723 memcpy(p, (char *)&x, sizeof x);
724 return 0;
725 }
726
727 static int
np_double(char * p,PyObject * v,const formatdef * f)728 np_double(char *p, PyObject *v, const formatdef *f)
729 {
730 double x = PyFloat_AsDouble(v);
731 if (x == -1 && PyErr_Occurred()) {
732 PyErr_SetString(StructError,
733 "required argument is not a float");
734 return -1;
735 }
736 memcpy(p, (char *)&x, sizeof(double));
737 return 0;
738 }
739
740 static int
np_void_p(char * p,PyObject * v,const formatdef * f)741 np_void_p(char *p, PyObject *v, const formatdef *f)
742 {
743 void *x;
744
745 v = get_pylong(v);
746 if (v == NULL)
747 return -1;
748 assert(PyLong_Check(v));
749 x = PyLong_AsVoidPtr(v);
750 Py_DECREF(v);
751 if (x == NULL && PyErr_Occurred())
752 return -1;
753 memcpy(p, (char *)&x, sizeof x);
754 return 0;
755 }
756
757 static const formatdef native_table[] = {
758 {'x', sizeof(char), 0, NULL},
759 {'b', sizeof(char), 0, nu_byte, np_byte},
760 {'B', sizeof(char), 0, nu_ubyte, np_ubyte},
761 {'c', sizeof(char), 0, nu_char, np_char},
762 {'s', sizeof(char), 0, NULL},
763 {'p', sizeof(char), 0, NULL},
764 {'h', sizeof(short), SHORT_ALIGN, nu_short, np_short},
765 {'H', sizeof(short), SHORT_ALIGN, nu_ushort, np_ushort},
766 {'i', sizeof(int), INT_ALIGN, nu_int, np_int},
767 {'I', sizeof(int), INT_ALIGN, nu_uint, np_uint},
768 {'l', sizeof(long), LONG_ALIGN, nu_long, np_long},
769 {'L', sizeof(long), LONG_ALIGN, nu_ulong, np_ulong},
770 {'n', sizeof(size_t), SIZE_T_ALIGN, nu_ssize_t, np_ssize_t},
771 {'N', sizeof(size_t), SIZE_T_ALIGN, nu_size_t, np_size_t},
772 {'q', sizeof(long long), LONG_LONG_ALIGN, nu_longlong, np_longlong},
773 {'Q', sizeof(long long), LONG_LONG_ALIGN, nu_ulonglong,np_ulonglong},
774 {'?', sizeof(_Bool), BOOL_ALIGN, nu_bool, np_bool},
775 {'e', sizeof(short), SHORT_ALIGN, nu_halffloat, np_halffloat},
776 {'f', sizeof(float), FLOAT_ALIGN, nu_float, np_float},
777 {'d', sizeof(double), DOUBLE_ALIGN, nu_double, np_double},
778 {'P', sizeof(void *), VOID_P_ALIGN, nu_void_p, np_void_p},
779 {0}
780 };
781
782 /* Big-endian routines. *****************************************************/
783
784 static PyObject *
bu_int(const char * p,const formatdef * f)785 bu_int(const char *p, const formatdef *f)
786 {
787 long x = 0;
788 Py_ssize_t i = f->size;
789 const unsigned char *bytes = (const unsigned char *)p;
790 do {
791 x = (x<<8) | *bytes++;
792 } while (--i > 0);
793 /* Extend the sign bit. */
794 if (SIZEOF_LONG > f->size)
795 x |= -(x & (1L << ((8 * f->size) - 1)));
796 return PyLong_FromLong(x);
797 }
798
799 static PyObject *
bu_uint(const char * p,const formatdef * f)800 bu_uint(const char *p, const formatdef *f)
801 {
802 unsigned long x = 0;
803 Py_ssize_t i = f->size;
804 const unsigned char *bytes = (const unsigned char *)p;
805 do {
806 x = (x<<8) | *bytes++;
807 } while (--i > 0);
808 return PyLong_FromUnsignedLong(x);
809 }
810
811 static PyObject *
bu_longlong(const char * p,const formatdef * f)812 bu_longlong(const char *p, const formatdef *f)
813 {
814 long long x = 0;
815 Py_ssize_t i = f->size;
816 const unsigned char *bytes = (const unsigned char *)p;
817 do {
818 x = (x<<8) | *bytes++;
819 } while (--i > 0);
820 /* Extend the sign bit. */
821 if (SIZEOF_LONG_LONG > f->size)
822 x |= -(x & ((long long)1 << ((8 * f->size) - 1)));
823 return PyLong_FromLongLong(x);
824 }
825
826 static PyObject *
bu_ulonglong(const char * p,const formatdef * f)827 bu_ulonglong(const char *p, const formatdef *f)
828 {
829 unsigned long long x = 0;
830 Py_ssize_t i = f->size;
831 const unsigned char *bytes = (const unsigned char *)p;
832 do {
833 x = (x<<8) | *bytes++;
834 } while (--i > 0);
835 return PyLong_FromUnsignedLongLong(x);
836 }
837
838 static PyObject *
bu_halffloat(const char * p,const formatdef * f)839 bu_halffloat(const char *p, const formatdef *f)
840 {
841 return unpack_halffloat(p, 0);
842 }
843
844 static PyObject *
bu_float(const char * p,const formatdef * f)845 bu_float(const char *p, const formatdef *f)
846 {
847 return unpack_float(p, 0);
848 }
849
850 static PyObject *
bu_double(const char * p,const formatdef * f)851 bu_double(const char *p, const formatdef *f)
852 {
853 return unpack_double(p, 0);
854 }
855
856 static PyObject *
bu_bool(const char * p,const formatdef * f)857 bu_bool(const char *p, const formatdef *f)
858 {
859 return PyBool_FromLong(*p != 0);
860 }
861
862 static int
bp_int(char * p,PyObject * v,const formatdef * f)863 bp_int(char *p, PyObject *v, const formatdef *f)
864 {
865 long x;
866 Py_ssize_t i;
867 unsigned char *q = (unsigned char *)p;
868 if (get_long(v, &x) < 0)
869 return -1;
870 i = f->size;
871 if (i != SIZEOF_LONG) {
872 if ((i == 2) && (x < -32768 || x > 32767))
873 RANGE_ERROR(x, f, 0, 0xffffL);
874 #if (SIZEOF_LONG != 4)
875 else if ((i == 4) && (x < -2147483648L || x > 2147483647L))
876 RANGE_ERROR(x, f, 0, 0xffffffffL);
877 #endif
878 }
879 do {
880 q[--i] = (unsigned char)(x & 0xffL);
881 x >>= 8;
882 } while (i > 0);
883 return 0;
884 }
885
886 static int
bp_uint(char * p,PyObject * v,const formatdef * f)887 bp_uint(char *p, PyObject *v, const formatdef *f)
888 {
889 unsigned long x;
890 Py_ssize_t i;
891 unsigned char *q = (unsigned char *)p;
892 if (get_ulong(v, &x) < 0)
893 return -1;
894 i = f->size;
895 if (i != SIZEOF_LONG) {
896 unsigned long maxint = 1;
897 maxint <<= (unsigned long)(i * 8);
898 if (x >= maxint)
899 RANGE_ERROR(x, f, 1, maxint - 1);
900 }
901 do {
902 q[--i] = (unsigned char)(x & 0xffUL);
903 x >>= 8;
904 } while (i > 0);
905 return 0;
906 }
907
908 static int
bp_longlong(char * p,PyObject * v,const formatdef * f)909 bp_longlong(char *p, PyObject *v, const formatdef *f)
910 {
911 int res;
912 v = get_pylong(v);
913 if (v == NULL)
914 return -1;
915 res = _PyLong_AsByteArray((PyLongObject *)v,
916 (unsigned char *)p,
917 8,
918 0, /* little_endian */
919 1 /* signed */);
920 Py_DECREF(v);
921 return res;
922 }
923
924 static int
bp_ulonglong(char * p,PyObject * v,const formatdef * f)925 bp_ulonglong(char *p, PyObject *v, const formatdef *f)
926 {
927 int res;
928 v = get_pylong(v);
929 if (v == NULL)
930 return -1;
931 res = _PyLong_AsByteArray((PyLongObject *)v,
932 (unsigned char *)p,
933 8,
934 0, /* little_endian */
935 0 /* signed */);
936 Py_DECREF(v);
937 return res;
938 }
939
940 static int
bp_halffloat(char * p,PyObject * v,const formatdef * f)941 bp_halffloat(char *p, PyObject *v, const formatdef *f)
942 {
943 return pack_halffloat(p, v, 0);
944 }
945
946 static int
bp_float(char * p,PyObject * v,const formatdef * f)947 bp_float(char *p, PyObject *v, const formatdef *f)
948 {
949 double x = PyFloat_AsDouble(v);
950 if (x == -1 && PyErr_Occurred()) {
951 PyErr_SetString(StructError,
952 "required argument is not a float");
953 return -1;
954 }
955 return _PyFloat_Pack4(x, (unsigned char *)p, 0);
956 }
957
958 static int
bp_double(char * p,PyObject * v,const formatdef * f)959 bp_double(char *p, PyObject *v, const formatdef *f)
960 {
961 double x = PyFloat_AsDouble(v);
962 if (x == -1 && PyErr_Occurred()) {
963 PyErr_SetString(StructError,
964 "required argument is not a float");
965 return -1;
966 }
967 return _PyFloat_Pack8(x, (unsigned char *)p, 0);
968 }
969
970 static int
bp_bool(char * p,PyObject * v,const formatdef * f)971 bp_bool(char *p, PyObject *v, const formatdef *f)
972 {
973 int y;
974 y = PyObject_IsTrue(v);
975 if (y < 0)
976 return -1;
977 *p = (char)y;
978 return 0;
979 }
980
981 static formatdef bigendian_table[] = {
982 {'x', 1, 0, NULL},
983 {'b', 1, 0, nu_byte, np_byte},
984 {'B', 1, 0, nu_ubyte, np_ubyte},
985 {'c', 1, 0, nu_char, np_char},
986 {'s', 1, 0, NULL},
987 {'p', 1, 0, NULL},
988 {'h', 2, 0, bu_int, bp_int},
989 {'H', 2, 0, bu_uint, bp_uint},
990 {'i', 4, 0, bu_int, bp_int},
991 {'I', 4, 0, bu_uint, bp_uint},
992 {'l', 4, 0, bu_int, bp_int},
993 {'L', 4, 0, bu_uint, bp_uint},
994 {'q', 8, 0, bu_longlong, bp_longlong},
995 {'Q', 8, 0, bu_ulonglong, bp_ulonglong},
996 {'?', 1, 0, bu_bool, bp_bool},
997 {'e', 2, 0, bu_halffloat, bp_halffloat},
998 {'f', 4, 0, bu_float, bp_float},
999 {'d', 8, 0, bu_double, bp_double},
1000 {0}
1001 };
1002
1003 /* Little-endian routines. *****************************************************/
1004
1005 static PyObject *
lu_int(const char * p,const formatdef * f)1006 lu_int(const char *p, const formatdef *f)
1007 {
1008 long x = 0;
1009 Py_ssize_t i = f->size;
1010 const unsigned char *bytes = (const unsigned char *)p;
1011 do {
1012 x = (x<<8) | bytes[--i];
1013 } while (i > 0);
1014 /* Extend the sign bit. */
1015 if (SIZEOF_LONG > f->size)
1016 x |= -(x & (1L << ((8 * f->size) - 1)));
1017 return PyLong_FromLong(x);
1018 }
1019
1020 static PyObject *
lu_uint(const char * p,const formatdef * f)1021 lu_uint(const char *p, const formatdef *f)
1022 {
1023 unsigned long x = 0;
1024 Py_ssize_t i = f->size;
1025 const unsigned char *bytes = (const unsigned char *)p;
1026 do {
1027 x = (x<<8) | bytes[--i];
1028 } while (i > 0);
1029 return PyLong_FromUnsignedLong(x);
1030 }
1031
1032 static PyObject *
lu_longlong(const char * p,const formatdef * f)1033 lu_longlong(const char *p, const formatdef *f)
1034 {
1035 long long x = 0;
1036 Py_ssize_t i = f->size;
1037 const unsigned char *bytes = (const unsigned char *)p;
1038 do {
1039 x = (x<<8) | bytes[--i];
1040 } while (i > 0);
1041 /* Extend the sign bit. */
1042 if (SIZEOF_LONG_LONG > f->size)
1043 x |= -(x & ((long long)1 << ((8 * f->size) - 1)));
1044 return PyLong_FromLongLong(x);
1045 }
1046
1047 static PyObject *
lu_ulonglong(const char * p,const formatdef * f)1048 lu_ulonglong(const char *p, const formatdef *f)
1049 {
1050 unsigned long long x = 0;
1051 Py_ssize_t i = f->size;
1052 const unsigned char *bytes = (const unsigned char *)p;
1053 do {
1054 x = (x<<8) | bytes[--i];
1055 } while (i > 0);
1056 return PyLong_FromUnsignedLongLong(x);
1057 }
1058
1059 static PyObject *
lu_halffloat(const char * p,const formatdef * f)1060 lu_halffloat(const char *p, const formatdef *f)
1061 {
1062 return unpack_halffloat(p, 1);
1063 }
1064
1065 static PyObject *
lu_float(const char * p,const formatdef * f)1066 lu_float(const char *p, const formatdef *f)
1067 {
1068 return unpack_float(p, 1);
1069 }
1070
1071 static PyObject *
lu_double(const char * p,const formatdef * f)1072 lu_double(const char *p, const formatdef *f)
1073 {
1074 return unpack_double(p, 1);
1075 }
1076
1077 static int
lp_int(char * p,PyObject * v,const formatdef * f)1078 lp_int(char *p, PyObject *v, const formatdef *f)
1079 {
1080 long x;
1081 Py_ssize_t i;
1082 unsigned char *q = (unsigned char *)p;
1083 if (get_long(v, &x) < 0)
1084 return -1;
1085 i = f->size;
1086 if (i != SIZEOF_LONG) {
1087 if ((i == 2) && (x < -32768 || x > 32767))
1088 RANGE_ERROR(x, f, 0, 0xffffL);
1089 #if (SIZEOF_LONG != 4)
1090 else if ((i == 4) && (x < -2147483648L || x > 2147483647L))
1091 RANGE_ERROR(x, f, 0, 0xffffffffL);
1092 #endif
1093 }
1094 do {
1095 *q++ = (unsigned char)(x & 0xffL);
1096 x >>= 8;
1097 } while (--i > 0);
1098 return 0;
1099 }
1100
1101 static int
lp_uint(char * p,PyObject * v,const formatdef * f)1102 lp_uint(char *p, PyObject *v, const formatdef *f)
1103 {
1104 unsigned long x;
1105 Py_ssize_t i;
1106 unsigned char *q = (unsigned char *)p;
1107 if (get_ulong(v, &x) < 0)
1108 return -1;
1109 i = f->size;
1110 if (i != SIZEOF_LONG) {
1111 unsigned long maxint = 1;
1112 maxint <<= (unsigned long)(i * 8);
1113 if (x >= maxint)
1114 RANGE_ERROR(x, f, 1, maxint - 1);
1115 }
1116 do {
1117 *q++ = (unsigned char)(x & 0xffUL);
1118 x >>= 8;
1119 } while (--i > 0);
1120 return 0;
1121 }
1122
1123 static int
lp_longlong(char * p,PyObject * v,const formatdef * f)1124 lp_longlong(char *p, PyObject *v, const formatdef *f)
1125 {
1126 int res;
1127 v = get_pylong(v);
1128 if (v == NULL)
1129 return -1;
1130 res = _PyLong_AsByteArray((PyLongObject*)v,
1131 (unsigned char *)p,
1132 8,
1133 1, /* little_endian */
1134 1 /* signed */);
1135 Py_DECREF(v);
1136 return res;
1137 }
1138
1139 static int
lp_ulonglong(char * p,PyObject * v,const formatdef * f)1140 lp_ulonglong(char *p, PyObject *v, const formatdef *f)
1141 {
1142 int res;
1143 v = get_pylong(v);
1144 if (v == NULL)
1145 return -1;
1146 res = _PyLong_AsByteArray((PyLongObject*)v,
1147 (unsigned char *)p,
1148 8,
1149 1, /* little_endian */
1150 0 /* signed */);
1151 Py_DECREF(v);
1152 return res;
1153 }
1154
1155 static int
lp_halffloat(char * p,PyObject * v,const formatdef * f)1156 lp_halffloat(char *p, PyObject *v, const formatdef *f)
1157 {
1158 return pack_halffloat(p, v, 1);
1159 }
1160
1161 static int
lp_float(char * p,PyObject * v,const formatdef * f)1162 lp_float(char *p, PyObject *v, const formatdef *f)
1163 {
1164 double x = PyFloat_AsDouble(v);
1165 if (x == -1 && PyErr_Occurred()) {
1166 PyErr_SetString(StructError,
1167 "required argument is not a float");
1168 return -1;
1169 }
1170 return _PyFloat_Pack4(x, (unsigned char *)p, 1);
1171 }
1172
1173 static int
lp_double(char * p,PyObject * v,const formatdef * f)1174 lp_double(char *p, PyObject *v, const formatdef *f)
1175 {
1176 double x = PyFloat_AsDouble(v);
1177 if (x == -1 && PyErr_Occurred()) {
1178 PyErr_SetString(StructError,
1179 "required argument is not a float");
1180 return -1;
1181 }
1182 return _PyFloat_Pack8(x, (unsigned char *)p, 1);
1183 }
1184
1185 static formatdef lilendian_table[] = {
1186 {'x', 1, 0, NULL},
1187 {'b', 1, 0, nu_byte, np_byte},
1188 {'B', 1, 0, nu_ubyte, np_ubyte},
1189 {'c', 1, 0, nu_char, np_char},
1190 {'s', 1, 0, NULL},
1191 {'p', 1, 0, NULL},
1192 {'h', 2, 0, lu_int, lp_int},
1193 {'H', 2, 0, lu_uint, lp_uint},
1194 {'i', 4, 0, lu_int, lp_int},
1195 {'I', 4, 0, lu_uint, lp_uint},
1196 {'l', 4, 0, lu_int, lp_int},
1197 {'L', 4, 0, lu_uint, lp_uint},
1198 {'q', 8, 0, lu_longlong, lp_longlong},
1199 {'Q', 8, 0, lu_ulonglong, lp_ulonglong},
1200 {'?', 1, 0, bu_bool, bp_bool}, /* Std rep not endian dep,
1201 but potentially different from native rep -- reuse bx_bool funcs. */
1202 {'e', 2, 0, lu_halffloat, lp_halffloat},
1203 {'f', 4, 0, lu_float, lp_float},
1204 {'d', 8, 0, lu_double, lp_double},
1205 {0}
1206 };
1207
1208
1209 static const formatdef *
whichtable(const char ** pfmt)1210 whichtable(const char **pfmt)
1211 {
1212 const char *fmt = (*pfmt)++; /* May be backed out of later */
1213 switch (*fmt) {
1214 case '<':
1215 return lilendian_table;
1216 case '>':
1217 case '!': /* Network byte order is big-endian */
1218 return bigendian_table;
1219 case '=': { /* Host byte order -- different from native in alignment! */
1220 #if PY_LITTLE_ENDIAN
1221 return lilendian_table;
1222 #else
1223 return bigendian_table;
1224 #endif
1225 }
1226 default:
1227 --*pfmt; /* Back out of pointer increment */
1228 /* Fall through */
1229 case '@':
1230 return native_table;
1231 }
1232 }
1233
1234
1235 /* Get the table entry for a format code */
1236
1237 static const formatdef *
getentry(int c,const formatdef * f)1238 getentry(int c, const formatdef *f)
1239 {
1240 for (; f->format != '\0'; f++) {
1241 if (f->format == c) {
1242 return f;
1243 }
1244 }
1245 PyErr_SetString(StructError, "bad char in struct format");
1246 return NULL;
1247 }
1248
1249
1250 /* Align a size according to a format code. Return -1 on overflow. */
1251
1252 static Py_ssize_t
align(Py_ssize_t size,char c,const formatdef * e)1253 align(Py_ssize_t size, char c, const formatdef *e)
1254 {
1255 Py_ssize_t extra;
1256
1257 if (e->format == c) {
1258 if (e->alignment && size > 0) {
1259 extra = (e->alignment - 1) - (size - 1) % (e->alignment);
1260 if (extra > PY_SSIZE_T_MAX - size)
1261 return -1;
1262 size += extra;
1263 }
1264 }
1265 return size;
1266 }
1267
1268 /*
1269 * Struct object implementation.
1270 */
1271
1272 /* calculate the size of a format string */
1273
1274 static int
prepare_s(PyStructObject * self)1275 prepare_s(PyStructObject *self)
1276 {
1277 const formatdef *f;
1278 const formatdef *e;
1279 formatcode *codes;
1280
1281 const char *s;
1282 const char *fmt;
1283 char c;
1284 Py_ssize_t size, len, num, itemsize;
1285 size_t ncodes;
1286
1287 fmt = PyBytes_AS_STRING(self->s_format);
1288
1289 f = whichtable(&fmt);
1290
1291 s = fmt;
1292 size = 0;
1293 len = 0;
1294 ncodes = 0;
1295 while ((c = *s++) != '\0') {
1296 if (Py_ISSPACE(Py_CHARMASK(c)))
1297 continue;
1298 if ('0' <= c && c <= '9') {
1299 num = c - '0';
1300 while ('0' <= (c = *s++) && c <= '9') {
1301 /* overflow-safe version of
1302 if (num*10 + (c - '0') > PY_SSIZE_T_MAX) { ... } */
1303 if (num >= PY_SSIZE_T_MAX / 10 && (
1304 num > PY_SSIZE_T_MAX / 10 ||
1305 (c - '0') > PY_SSIZE_T_MAX % 10))
1306 goto overflow;
1307 num = num*10 + (c - '0');
1308 }
1309 if (c == '\0') {
1310 PyErr_SetString(StructError,
1311 "repeat count given without format specifier");
1312 return -1;
1313 }
1314 }
1315 else
1316 num = 1;
1317
1318 e = getentry(c, f);
1319 if (e == NULL)
1320 return -1;
1321
1322 switch (c) {
1323 case 's': /* fall through */
1324 case 'p': len++; ncodes++; break;
1325 case 'x': break;
1326 default: len += num; if (num) ncodes++; break;
1327 }
1328
1329 itemsize = e->size;
1330 size = align(size, c, e);
1331 if (size == -1)
1332 goto overflow;
1333
1334 /* if (size + num * itemsize > PY_SSIZE_T_MAX) { ... } */
1335 if (num > (PY_SSIZE_T_MAX - size) / itemsize)
1336 goto overflow;
1337 size += num * itemsize;
1338 }
1339
1340 /* check for overflow */
1341 if ((ncodes + 1) > ((size_t)PY_SSIZE_T_MAX / sizeof(formatcode))) {
1342 PyErr_NoMemory();
1343 return -1;
1344 }
1345
1346 self->s_size = size;
1347 self->s_len = len;
1348 codes = PyMem_MALLOC((ncodes + 1) * sizeof(formatcode));
1349 if (codes == NULL) {
1350 PyErr_NoMemory();
1351 return -1;
1352 }
1353 /* Free any s_codes value left over from a previous initialization. */
1354 if (self->s_codes != NULL)
1355 PyMem_FREE(self->s_codes);
1356 self->s_codes = codes;
1357
1358 s = fmt;
1359 size = 0;
1360 while ((c = *s++) != '\0') {
1361 if (Py_ISSPACE(Py_CHARMASK(c)))
1362 continue;
1363 if ('0' <= c && c <= '9') {
1364 num = c - '0';
1365 while ('0' <= (c = *s++) && c <= '9')
1366 num = num*10 + (c - '0');
1367 }
1368 else
1369 num = 1;
1370
1371 e = getentry(c, f);
1372
1373 size = align(size, c, e);
1374 if (c == 's' || c == 'p') {
1375 codes->offset = size;
1376 codes->size = num;
1377 codes->fmtdef = e;
1378 codes->repeat = 1;
1379 codes++;
1380 size += num;
1381 } else if (c == 'x') {
1382 size += num;
1383 } else if (num) {
1384 codes->offset = size;
1385 codes->size = e->size;
1386 codes->fmtdef = e;
1387 codes->repeat = num;
1388 codes++;
1389 size += e->size * num;
1390 }
1391 }
1392 codes->fmtdef = NULL;
1393 codes->offset = size;
1394 codes->size = 0;
1395 codes->repeat = 0;
1396
1397 return 0;
1398
1399 overflow:
1400 PyErr_SetString(StructError,
1401 "total struct size too long");
1402 return -1;
1403 }
1404
1405 static PyObject *
s_new(PyTypeObject * type,PyObject * args,PyObject * kwds)1406 s_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
1407 {
1408 PyObject *self;
1409
1410 assert(type != NULL && type->tp_alloc != NULL);
1411
1412 self = type->tp_alloc(type, 0);
1413 if (self != NULL) {
1414 PyStructObject *s = (PyStructObject*)self;
1415 Py_INCREF(Py_None);
1416 s->s_format = Py_None;
1417 s->s_codes = NULL;
1418 s->s_size = -1;
1419 s->s_len = -1;
1420 }
1421 return self;
1422 }
1423
1424 /*[clinic input]
1425 Struct.__init__
1426
1427 format: object
1428
1429 Create a compiled struct object.
1430
1431 Return a new Struct object which writes and reads binary data according to
1432 the format string.
1433
1434 See help(struct) for more on format strings.
1435 [clinic start generated code]*/
1436
1437 static int
Struct___init___impl(PyStructObject * self,PyObject * format)1438 Struct___init___impl(PyStructObject *self, PyObject *format)
1439 /*[clinic end generated code: output=b8e80862444e92d0 input=192a4575a3dde802]*/
1440 {
1441 int ret = 0;
1442
1443 if (PyUnicode_Check(format)) {
1444 format = PyUnicode_AsASCIIString(format);
1445 if (format == NULL)
1446 return -1;
1447 }
1448 /* XXX support buffer interface, too */
1449 else {
1450 Py_INCREF(format);
1451 }
1452
1453 if (!PyBytes_Check(format)) {
1454 Py_DECREF(format);
1455 PyErr_Format(PyExc_TypeError,
1456 "Struct() argument 1 must be a str or bytes object, "
1457 "not %.200s",
1458 Py_TYPE(format)->tp_name);
1459 return -1;
1460 }
1461
1462 Py_SETREF(self->s_format, format);
1463
1464 ret = prepare_s(self);
1465 return ret;
1466 }
1467
1468 static void
s_dealloc(PyStructObject * s)1469 s_dealloc(PyStructObject *s)
1470 {
1471 if (s->weakreflist != NULL)
1472 PyObject_ClearWeakRefs((PyObject *)s);
1473 if (s->s_codes != NULL) {
1474 PyMem_FREE(s->s_codes);
1475 }
1476 Py_DECREF(s->s_format);
1477 Py_TYPE(s)->tp_free((PyObject *)s);
1478 }
1479
1480 static PyObject *
s_unpack_internal(PyStructObject * soself,const char * startfrom)1481 s_unpack_internal(PyStructObject *soself, const char *startfrom) {
1482 formatcode *code;
1483 Py_ssize_t i = 0;
1484 PyObject *result = PyTuple_New(soself->s_len);
1485 if (result == NULL)
1486 return NULL;
1487
1488 for (code = soself->s_codes; code->fmtdef != NULL; code++) {
1489 const formatdef *e = code->fmtdef;
1490 const char *res = startfrom + code->offset;
1491 Py_ssize_t j = code->repeat;
1492 while (j--) {
1493 PyObject *v;
1494 if (e->format == 's') {
1495 v = PyBytes_FromStringAndSize(res, code->size);
1496 } else if (e->format == 'p') {
1497 Py_ssize_t n = *(unsigned char*)res;
1498 if (n >= code->size)
1499 n = code->size - 1;
1500 v = PyBytes_FromStringAndSize(res + 1, n);
1501 } else {
1502 v = e->unpack(res, e);
1503 }
1504 if (v == NULL)
1505 goto fail;
1506 PyTuple_SET_ITEM(result, i++, v);
1507 res += code->size;
1508 }
1509 }
1510
1511 return result;
1512 fail:
1513 Py_DECREF(result);
1514 return NULL;
1515 }
1516
1517
1518 /*[clinic input]
1519 Struct.unpack
1520
1521 buffer: Py_buffer
1522 /
1523
1524 Return a tuple containing unpacked values.
1525
1526 Unpack according to the format string Struct.format. The buffer's size
1527 in bytes must be Struct.size.
1528
1529 See help(struct) for more on format strings.
1530 [clinic start generated code]*/
1531
1532 static PyObject *
Struct_unpack_impl(PyStructObject * self,Py_buffer * buffer)1533 Struct_unpack_impl(PyStructObject *self, Py_buffer *buffer)
1534 /*[clinic end generated code: output=873a24faf02e848a input=3113f8e7038b2f6c]*/
1535 {
1536 assert(self->s_codes != NULL);
1537 if (buffer->len != self->s_size) {
1538 PyErr_Format(StructError,
1539 "unpack requires a buffer of %zd bytes",
1540 self->s_size);
1541 return NULL;
1542 }
1543 return s_unpack_internal(self, buffer->buf);
1544 }
1545
1546 /*[clinic input]
1547 Struct.unpack_from
1548
1549 buffer: Py_buffer
1550 offset: Py_ssize_t = 0
1551
1552 Return a tuple containing unpacked values.
1553
1554 Values are unpacked according to the format string Struct.format.
1555
1556 The buffer's size in bytes, starting at position offset, must be
1557 at least Struct.size.
1558
1559 See help(struct) for more on format strings.
1560 [clinic start generated code]*/
1561
1562 static PyObject *
Struct_unpack_from_impl(PyStructObject * self,Py_buffer * buffer,Py_ssize_t offset)1563 Struct_unpack_from_impl(PyStructObject *self, Py_buffer *buffer,
1564 Py_ssize_t offset)
1565 /*[clinic end generated code: output=57fac875e0977316 input=cafd4851d473c894]*/
1566 {
1567 assert(self->s_codes != NULL);
1568
1569 if (offset < 0) {
1570 if (offset + self->s_size > 0) {
1571 PyErr_Format(StructError,
1572 "not enough data to unpack %zd bytes at offset %zd",
1573 self->s_size,
1574 offset);
1575 return NULL;
1576 }
1577
1578 if (offset + buffer->len < 0) {
1579 PyErr_Format(StructError,
1580 "offset %zd out of range for %zd-byte buffer",
1581 offset,
1582 buffer->len);
1583 return NULL;
1584 }
1585 offset += buffer->len;
1586 }
1587
1588 if ((buffer->len - offset) < self->s_size) {
1589 PyErr_Format(StructError,
1590 "unpack_from requires a buffer of at least %zu bytes for "
1591 "unpacking %zd bytes at offset %zd "
1592 "(actual buffer size is %zd)",
1593 (size_t)self->s_size + (size_t)offset,
1594 self->s_size,
1595 offset,
1596 buffer->len);
1597 return NULL;
1598 }
1599 return s_unpack_internal(self, (char*)buffer->buf + offset);
1600 }
1601
1602
1603
1604 /* Unpack iterator type */
1605
1606 typedef struct {
1607 PyObject_HEAD
1608 PyStructObject *so;
1609 Py_buffer buf;
1610 Py_ssize_t index;
1611 } unpackiterobject;
1612
1613 static void
unpackiter_dealloc(unpackiterobject * self)1614 unpackiter_dealloc(unpackiterobject *self)
1615 {
1616 /* bpo-31095: UnTrack is needed before calling any callbacks */
1617 PyObject_GC_UnTrack(self);
1618 Py_XDECREF(self->so);
1619 PyBuffer_Release(&self->buf);
1620 PyObject_GC_Del(self);
1621 }
1622
1623 static int
unpackiter_traverse(unpackiterobject * self,visitproc visit,void * arg)1624 unpackiter_traverse(unpackiterobject *self, visitproc visit, void *arg)
1625 {
1626 Py_VISIT(self->so);
1627 Py_VISIT(self->buf.obj);
1628 return 0;
1629 }
1630
1631 static PyObject *
unpackiter_len(unpackiterobject * self,PyObject * Py_UNUSED (ignored))1632 unpackiter_len(unpackiterobject *self, PyObject *Py_UNUSED(ignored))
1633 {
1634 Py_ssize_t len;
1635 if (self->so == NULL)
1636 len = 0;
1637 else
1638 len = (self->buf.len - self->index) / self->so->s_size;
1639 return PyLong_FromSsize_t(len);
1640 }
1641
1642 static PyMethodDef unpackiter_methods[] = {
1643 {"__length_hint__", (PyCFunction) unpackiter_len, METH_NOARGS, NULL},
1644 {NULL, NULL} /* sentinel */
1645 };
1646
1647 static PyObject *
unpackiter_iternext(unpackiterobject * self)1648 unpackiter_iternext(unpackiterobject *self)
1649 {
1650 PyObject *result;
1651 if (self->so == NULL)
1652 return NULL;
1653 if (self->index >= self->buf.len) {
1654 /* Iterator exhausted */
1655 Py_CLEAR(self->so);
1656 PyBuffer_Release(&self->buf);
1657 return NULL;
1658 }
1659 assert(self->index + self->so->s_size <= self->buf.len);
1660 result = s_unpack_internal(self->so,
1661 (char*) self->buf.buf + self->index);
1662 self->index += self->so->s_size;
1663 return result;
1664 }
1665
1666 static PyTypeObject unpackiter_type = {
1667 PyVarObject_HEAD_INIT(NULL, 0)
1668 "unpack_iterator", /* tp_name */
1669 sizeof(unpackiterobject), /* tp_basicsize */
1670 0, /* tp_itemsize */
1671 (destructor)unpackiter_dealloc, /* tp_dealloc */
1672 0, /* tp_vectorcall_offset */
1673 0, /* tp_getattr */
1674 0, /* tp_setattr */
1675 0, /* tp_as_async */
1676 0, /* tp_repr */
1677 0, /* tp_as_number */
1678 0, /* tp_as_sequence */
1679 0, /* tp_as_mapping */
1680 0, /* tp_hash */
1681 0, /* tp_call */
1682 0, /* tp_str */
1683 PyObject_GenericGetAttr, /* tp_getattro */
1684 0, /* tp_setattro */
1685 0, /* tp_as_buffer */
1686 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, /* tp_flags */
1687 0, /* tp_doc */
1688 (traverseproc)unpackiter_traverse, /* tp_traverse */
1689 0, /* tp_clear */
1690 0, /* tp_richcompare */
1691 0, /* tp_weaklistoffset */
1692 PyObject_SelfIter, /* tp_iter */
1693 (iternextfunc)unpackiter_iternext, /* tp_iternext */
1694 unpackiter_methods /* tp_methods */
1695 };
1696
1697 /*[clinic input]
1698 Struct.iter_unpack
1699
1700 buffer: object
1701 /
1702
1703 Return an iterator yielding tuples.
1704
1705 Tuples are unpacked from the given bytes source, like a repeated
1706 invocation of unpack_from().
1707
1708 Requires that the bytes length be a multiple of the struct size.
1709 [clinic start generated code]*/
1710
1711 static PyObject *
Struct_iter_unpack(PyStructObject * self,PyObject * buffer)1712 Struct_iter_unpack(PyStructObject *self, PyObject *buffer)
1713 /*[clinic end generated code: output=172d83d0cd15dbab input=6d65b3f3107dbc99]*/
1714 {
1715 unpackiterobject *iter;
1716
1717 assert(self->s_codes != NULL);
1718
1719 if (self->s_size == 0) {
1720 PyErr_Format(StructError,
1721 "cannot iteratively unpack with a struct of length 0");
1722 return NULL;
1723 }
1724
1725 iter = (unpackiterobject *) PyType_GenericAlloc(&unpackiter_type, 0);
1726 if (iter == NULL)
1727 return NULL;
1728
1729 if (PyObject_GetBuffer(buffer, &iter->buf, PyBUF_SIMPLE) < 0) {
1730 Py_DECREF(iter);
1731 return NULL;
1732 }
1733 if (iter->buf.len % self->s_size != 0) {
1734 PyErr_Format(StructError,
1735 "iterative unpacking requires a buffer of "
1736 "a multiple of %zd bytes",
1737 self->s_size);
1738 Py_DECREF(iter);
1739 return NULL;
1740 }
1741 Py_INCREF(self);
1742 iter->so = self;
1743 iter->index = 0;
1744 return (PyObject *)iter;
1745 }
1746
1747
1748 /*
1749 * Guts of the pack function.
1750 *
1751 * Takes a struct object, a tuple of arguments, and offset in that tuple of
1752 * argument for where to start processing the arguments for packing, and a
1753 * character buffer for writing the packed string. The caller must insure
1754 * that the buffer may contain the required length for packing the arguments.
1755 * 0 is returned on success, 1 is returned if there is an error.
1756 *
1757 */
1758 static int
s_pack_internal(PyStructObject * soself,PyObject * const * args,int offset,char * buf)1759 s_pack_internal(PyStructObject *soself, PyObject *const *args, int offset, char* buf)
1760 {
1761 formatcode *code;
1762 /* XXX(nnorwitz): why does i need to be a local? can we use
1763 the offset parameter or do we need the wider width? */
1764 Py_ssize_t i;
1765
1766 memset(buf, '\0', soself->s_size);
1767 i = offset;
1768 for (code = soself->s_codes; code->fmtdef != NULL; code++) {
1769 const formatdef *e = code->fmtdef;
1770 char *res = buf + code->offset;
1771 Py_ssize_t j = code->repeat;
1772 while (j--) {
1773 PyObject *v = args[i++];
1774 if (e->format == 's') {
1775 Py_ssize_t n;
1776 int isstring;
1777 void *p;
1778 isstring = PyBytes_Check(v);
1779 if (!isstring && !PyByteArray_Check(v)) {
1780 PyErr_SetString(StructError,
1781 "argument for 's' must be a bytes object");
1782 return -1;
1783 }
1784 if (isstring) {
1785 n = PyBytes_GET_SIZE(v);
1786 p = PyBytes_AS_STRING(v);
1787 }
1788 else {
1789 n = PyByteArray_GET_SIZE(v);
1790 p = PyByteArray_AS_STRING(v);
1791 }
1792 if (n > code->size)
1793 n = code->size;
1794 if (n > 0)
1795 memcpy(res, p, n);
1796 } else if (e->format == 'p') {
1797 Py_ssize_t n;
1798 int isstring;
1799 void *p;
1800 isstring = PyBytes_Check(v);
1801 if (!isstring && !PyByteArray_Check(v)) {
1802 PyErr_SetString(StructError,
1803 "argument for 'p' must be a bytes object");
1804 return -1;
1805 }
1806 if (isstring) {
1807 n = PyBytes_GET_SIZE(v);
1808 p = PyBytes_AS_STRING(v);
1809 }
1810 else {
1811 n = PyByteArray_GET_SIZE(v);
1812 p = PyByteArray_AS_STRING(v);
1813 }
1814 if (n > (code->size - 1))
1815 n = code->size - 1;
1816 if (n > 0)
1817 memcpy(res + 1, p, n);
1818 if (n > 255)
1819 n = 255;
1820 *res = Py_SAFE_DOWNCAST(n, Py_ssize_t, unsigned char);
1821 } else {
1822 if (e->pack(res, v, e) < 0) {
1823 if (PyLong_Check(v) && PyErr_ExceptionMatches(PyExc_OverflowError))
1824 PyErr_SetString(StructError,
1825 "int too large to convert");
1826 return -1;
1827 }
1828 }
1829 res += code->size;
1830 }
1831 }
1832
1833 /* Success */
1834 return 0;
1835 }
1836
1837
1838 PyDoc_STRVAR(s_pack__doc__,
1839 "S.pack(v1, v2, ...) -> bytes\n\
1840 \n\
1841 Return a bytes object containing values v1, v2, ... packed according\n\
1842 to the format string S.format. See help(struct) for more on format\n\
1843 strings.");
1844
1845 static PyObject *
s_pack(PyObject * self,PyObject * const * args,Py_ssize_t nargs)1846 s_pack(PyObject *self, PyObject *const *args, Py_ssize_t nargs)
1847 {
1848 PyStructObject *soself;
1849 PyObject *result;
1850
1851 /* Validate arguments. */
1852 soself = (PyStructObject *)self;
1853 assert(PyStruct_Check(self));
1854 assert(soself->s_codes != NULL);
1855 if (nargs != soself->s_len)
1856 {
1857 PyErr_Format(StructError,
1858 "pack expected %zd items for packing (got %zd)", soself->s_len, nargs);
1859 return NULL;
1860 }
1861
1862 /* Allocate a new buffer */
1863 result = PyBytes_FromStringAndSize((char *)NULL, soself->s_size);
1864 if (result == NULL)
1865 return NULL;
1866
1867 /* Call the guts */
1868 if ( s_pack_internal(soself, args, 0, PyBytes_AS_STRING(result)) != 0 ) {
1869 Py_DECREF(result);
1870 return NULL;
1871 }
1872
1873 return result;
1874 }
1875
1876 PyDoc_STRVAR(s_pack_into__doc__,
1877 "S.pack_into(buffer, offset, v1, v2, ...)\n\
1878 \n\
1879 Pack the values v1, v2, ... according to the format string S.format\n\
1880 and write the packed bytes into the writable buffer buf starting at\n\
1881 offset. Note that the offset is a required argument. See\n\
1882 help(struct) for more on format strings.");
1883
1884 static PyObject *
s_pack_into(PyObject * self,PyObject * const * args,Py_ssize_t nargs)1885 s_pack_into(PyObject *self, PyObject *const *args, Py_ssize_t nargs)
1886 {
1887 PyStructObject *soself;
1888 Py_buffer buffer;
1889 Py_ssize_t offset;
1890
1891 /* Validate arguments. +1 is for the first arg as buffer. */
1892 soself = (PyStructObject *)self;
1893 assert(PyStruct_Check(self));
1894 assert(soself->s_codes != NULL);
1895 if (nargs != (soself->s_len + 2))
1896 {
1897 if (nargs == 0) {
1898 PyErr_Format(StructError,
1899 "pack_into expected buffer argument");
1900 }
1901 else if (nargs == 1) {
1902 PyErr_Format(StructError,
1903 "pack_into expected offset argument");
1904 }
1905 else {
1906 PyErr_Format(StructError,
1907 "pack_into expected %zd items for packing (got %zd)",
1908 soself->s_len, (nargs - 2));
1909 }
1910 return NULL;
1911 }
1912
1913 /* Extract a writable memory buffer from the first argument */
1914 if (!PyArg_Parse(args[0], "w*", &buffer))
1915 return NULL;
1916 assert(buffer.len >= 0);
1917
1918 /* Extract the offset from the first argument */
1919 offset = PyNumber_AsSsize_t(args[1], PyExc_IndexError);
1920 if (offset == -1 && PyErr_Occurred()) {
1921 PyBuffer_Release(&buffer);
1922 return NULL;
1923 }
1924
1925 /* Support negative offsets. */
1926 if (offset < 0) {
1927 /* Check that negative offset is low enough to fit data */
1928 if (offset + soself->s_size > 0) {
1929 PyErr_Format(StructError,
1930 "no space to pack %zd bytes at offset %zd",
1931 soself->s_size,
1932 offset);
1933 PyBuffer_Release(&buffer);
1934 return NULL;
1935 }
1936
1937 /* Check that negative offset is not crossing buffer boundary */
1938 if (offset + buffer.len < 0) {
1939 PyErr_Format(StructError,
1940 "offset %zd out of range for %zd-byte buffer",
1941 offset,
1942 buffer.len);
1943 PyBuffer_Release(&buffer);
1944 return NULL;
1945 }
1946
1947 offset += buffer.len;
1948 }
1949
1950 /* Check boundaries */
1951 if ((buffer.len - offset) < soself->s_size) {
1952 assert(offset >= 0);
1953 assert(soself->s_size >= 0);
1954
1955 PyErr_Format(StructError,
1956 "pack_into requires a buffer of at least %zu bytes for "
1957 "packing %zd bytes at offset %zd "
1958 "(actual buffer size is %zd)",
1959 (size_t)soself->s_size + (size_t)offset,
1960 soself->s_size,
1961 offset,
1962 buffer.len);
1963 PyBuffer_Release(&buffer);
1964 return NULL;
1965 }
1966
1967 /* Call the guts */
1968 if (s_pack_internal(soself, args, 2, (char*)buffer.buf + offset) != 0) {
1969 PyBuffer_Release(&buffer);
1970 return NULL;
1971 }
1972
1973 PyBuffer_Release(&buffer);
1974 Py_RETURN_NONE;
1975 }
1976
1977 static PyObject *
s_get_format(PyStructObject * self,void * unused)1978 s_get_format(PyStructObject *self, void *unused)
1979 {
1980 return PyUnicode_FromStringAndSize(PyBytes_AS_STRING(self->s_format),
1981 PyBytes_GET_SIZE(self->s_format));
1982 }
1983
1984 static PyObject *
s_get_size(PyStructObject * self,void * unused)1985 s_get_size(PyStructObject *self, void *unused)
1986 {
1987 return PyLong_FromSsize_t(self->s_size);
1988 }
1989
1990 PyDoc_STRVAR(s_sizeof__doc__,
1991 "S.__sizeof__() -> size of S in memory, in bytes");
1992
1993 static PyObject *
s_sizeof(PyStructObject * self,void * unused)1994 s_sizeof(PyStructObject *self, void *unused)
1995 {
1996 Py_ssize_t size;
1997 formatcode *code;
1998
1999 size = _PyObject_SIZE(Py_TYPE(self)) + sizeof(formatcode);
2000 for (code = self->s_codes; code->fmtdef != NULL; code++)
2001 size += sizeof(formatcode);
2002 return PyLong_FromSsize_t(size);
2003 }
2004
2005 /* List of functions */
2006
2007 static struct PyMethodDef s_methods[] = {
2008 STRUCT_ITER_UNPACK_METHODDEF
2009 {"pack", (PyCFunction)(void(*)(void))s_pack, METH_FASTCALL, s_pack__doc__},
2010 {"pack_into", (PyCFunction)(void(*)(void))s_pack_into, METH_FASTCALL, s_pack_into__doc__},
2011 STRUCT_UNPACK_METHODDEF
2012 STRUCT_UNPACK_FROM_METHODDEF
2013 {"__sizeof__", (PyCFunction)s_sizeof, METH_NOARGS, s_sizeof__doc__},
2014 {NULL, NULL} /* sentinel */
2015 };
2016
2017 #define OFF(x) offsetof(PyStructObject, x)
2018
2019 static PyGetSetDef s_getsetlist[] = {
2020 {"format", (getter)s_get_format, (setter)NULL, "struct format string", NULL},
2021 {"size", (getter)s_get_size, (setter)NULL, "struct size in bytes", NULL},
2022 {NULL} /* sentinel */
2023 };
2024
2025 static
2026 PyTypeObject PyStructType = {
2027 PyVarObject_HEAD_INIT(NULL, 0)
2028 "Struct",
2029 sizeof(PyStructObject),
2030 0,
2031 (destructor)s_dealloc, /* tp_dealloc */
2032 0, /* tp_vectorcall_offset */
2033 0, /* tp_getattr */
2034 0, /* tp_setattr */
2035 0, /* tp_as_async */
2036 0, /* tp_repr */
2037 0, /* tp_as_number */
2038 0, /* tp_as_sequence */
2039 0, /* tp_as_mapping */
2040 0, /* tp_hash */
2041 0, /* tp_call */
2042 0, /* tp_str */
2043 PyObject_GenericGetAttr, /* tp_getattro */
2044 PyObject_GenericSetAttr, /* tp_setattro */
2045 0, /* tp_as_buffer */
2046 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */
2047 Struct___init____doc__, /* tp_doc */
2048 0, /* tp_traverse */
2049 0, /* tp_clear */
2050 0, /* tp_richcompare */
2051 offsetof(PyStructObject, weakreflist), /* tp_weaklistoffset */
2052 0, /* tp_iter */
2053 0, /* tp_iternext */
2054 s_methods, /* tp_methods */
2055 NULL, /* tp_members */
2056 s_getsetlist, /* tp_getset */
2057 0, /* tp_base */
2058 0, /* tp_dict */
2059 0, /* tp_descr_get */
2060 0, /* tp_descr_set */
2061 0, /* tp_dictoffset */
2062 Struct___init__, /* tp_init */
2063 PyType_GenericAlloc, /* tp_alloc */
2064 s_new, /* tp_new */
2065 PyObject_Del, /* tp_free */
2066 };
2067
2068
2069 /* ---- Standalone functions ---- */
2070
2071 #define MAXCACHE 100
2072 static PyObject *cache = NULL;
2073
2074 static int
cache_struct_converter(PyObject * fmt,PyStructObject ** ptr)2075 cache_struct_converter(PyObject *fmt, PyStructObject **ptr)
2076 {
2077 PyObject * s_object;
2078
2079 if (fmt == NULL) {
2080 Py_DECREF(*ptr);
2081 *ptr = NULL;
2082 return 1;
2083 }
2084
2085 if (cache == NULL) {
2086 cache = PyDict_New();
2087 if (cache == NULL)
2088 return 0;
2089 }
2090
2091 s_object = PyDict_GetItemWithError(cache, fmt);
2092 if (s_object != NULL) {
2093 Py_INCREF(s_object);
2094 *ptr = (PyStructObject *)s_object;
2095 return Py_CLEANUP_SUPPORTED;
2096 }
2097 else if (PyErr_Occurred()) {
2098 return 0;
2099 }
2100
2101 s_object = PyObject_CallFunctionObjArgs((PyObject *)(&PyStructType), fmt, NULL);
2102 if (s_object != NULL) {
2103 if (PyDict_GET_SIZE(cache) >= MAXCACHE)
2104 PyDict_Clear(cache);
2105 /* Attempt to cache the result */
2106 if (PyDict_SetItem(cache, fmt, s_object) == -1)
2107 PyErr_Clear();
2108 *ptr = (PyStructObject *)s_object;
2109 return Py_CLEANUP_SUPPORTED;
2110 }
2111 return 0;
2112 }
2113
2114 /*[clinic input]
2115 _clearcache
2116
2117 Clear the internal cache.
2118 [clinic start generated code]*/
2119
2120 static PyObject *
_clearcache_impl(PyObject * module)2121 _clearcache_impl(PyObject *module)
2122 /*[clinic end generated code: output=ce4fb8a7bf7cb523 input=463eaae04bab3211]*/
2123 {
2124 Py_CLEAR(cache);
2125 Py_RETURN_NONE;
2126 }
2127
2128
2129 /*[clinic input]
2130 calcsize -> Py_ssize_t
2131
2132 format as s_object: cache_struct
2133 /
2134
2135 Return size in bytes of the struct described by the format string.
2136 [clinic start generated code]*/
2137
2138 static Py_ssize_t
calcsize_impl(PyObject * module,PyStructObject * s_object)2139 calcsize_impl(PyObject *module, PyStructObject *s_object)
2140 /*[clinic end generated code: output=db7d23d09c6932c4 input=96a6a590c7717ecd]*/
2141 {
2142 return s_object->s_size;
2143 }
2144
2145 PyDoc_STRVAR(pack_doc,
2146 "pack(format, v1, v2, ...) -> bytes\n\
2147 \n\
2148 Return a bytes object containing the values v1, v2, ... packed according\n\
2149 to the format string. See help(struct) for more on format strings.");
2150
2151 static PyObject *
pack(PyObject * self,PyObject * const * args,Py_ssize_t nargs)2152 pack(PyObject *self, PyObject *const *args, Py_ssize_t nargs)
2153 {
2154 PyObject *s_object = NULL;
2155 PyObject *format, *result;
2156
2157 if (nargs == 0) {
2158 PyErr_SetString(PyExc_TypeError, "missing format argument");
2159 return NULL;
2160 }
2161 format = args[0];
2162
2163 if (!cache_struct_converter(format, (PyStructObject **)&s_object)) {
2164 return NULL;
2165 }
2166 result = s_pack(s_object, args + 1, nargs - 1);
2167 Py_DECREF(s_object);
2168 return result;
2169 }
2170
2171 PyDoc_STRVAR(pack_into_doc,
2172 "pack_into(format, buffer, offset, v1, v2, ...)\n\
2173 \n\
2174 Pack the values v1, v2, ... according to the format string and write\n\
2175 the packed bytes into the writable buffer buf starting at offset. Note\n\
2176 that the offset is a required argument. See help(struct) for more\n\
2177 on format strings.");
2178
2179 static PyObject *
pack_into(PyObject * self,PyObject * const * args,Py_ssize_t nargs)2180 pack_into(PyObject *self, PyObject *const *args, Py_ssize_t nargs)
2181 {
2182 PyObject *s_object = NULL;
2183 PyObject *format, *result;
2184
2185 if (nargs == 0) {
2186 PyErr_SetString(PyExc_TypeError, "missing format argument");
2187 return NULL;
2188 }
2189 format = args[0];
2190
2191 if (!cache_struct_converter(format, (PyStructObject **)&s_object)) {
2192 return NULL;
2193 }
2194 result = s_pack_into(s_object, args + 1, nargs - 1);
2195 Py_DECREF(s_object);
2196 return result;
2197 }
2198
2199 /*[clinic input]
2200 unpack
2201
2202 format as s_object: cache_struct
2203 buffer: Py_buffer
2204 /
2205
2206 Return a tuple containing values unpacked according to the format string.
2207
2208 The buffer's size in bytes must be calcsize(format).
2209
2210 See help(struct) for more on format strings.
2211 [clinic start generated code]*/
2212
2213 static PyObject *
unpack_impl(PyObject * module,PyStructObject * s_object,Py_buffer * buffer)2214 unpack_impl(PyObject *module, PyStructObject *s_object, Py_buffer *buffer)
2215 /*[clinic end generated code: output=48ddd4d88eca8551 input=05fa3b91678da727]*/
2216 {
2217 return Struct_unpack_impl(s_object, buffer);
2218 }
2219
2220 /*[clinic input]
2221 unpack_from
2222
2223 format as s_object: cache_struct
2224 /
2225 buffer: Py_buffer
2226 offset: Py_ssize_t = 0
2227
2228 Return a tuple containing values unpacked according to the format string.
2229
2230 The buffer's size, minus offset, must be at least calcsize(format).
2231
2232 See help(struct) for more on format strings.
2233 [clinic start generated code]*/
2234
2235 static PyObject *
unpack_from_impl(PyObject * module,PyStructObject * s_object,Py_buffer * buffer,Py_ssize_t offset)2236 unpack_from_impl(PyObject *module, PyStructObject *s_object,
2237 Py_buffer *buffer, Py_ssize_t offset)
2238 /*[clinic end generated code: output=1042631674c6e0d3 input=6e80a5398e985025]*/
2239 {
2240 return Struct_unpack_from_impl(s_object, buffer, offset);
2241 }
2242
2243 /*[clinic input]
2244 iter_unpack
2245
2246 format as s_object: cache_struct
2247 buffer: object
2248 /
2249
2250 Return an iterator yielding tuples unpacked from the given bytes.
2251
2252 The bytes are unpacked according to the format string, like
2253 a repeated invocation of unpack_from().
2254
2255 Requires that the bytes length be a multiple of the format struct size.
2256 [clinic start generated code]*/
2257
2258 static PyObject *
iter_unpack_impl(PyObject * module,PyStructObject * s_object,PyObject * buffer)2259 iter_unpack_impl(PyObject *module, PyStructObject *s_object,
2260 PyObject *buffer)
2261 /*[clinic end generated code: output=0ae50e250d20e74d input=b214a58869a3c98d]*/
2262 {
2263 return Struct_iter_unpack(s_object, buffer);
2264 }
2265
2266 static struct PyMethodDef module_functions[] = {
2267 _CLEARCACHE_METHODDEF
2268 CALCSIZE_METHODDEF
2269 ITER_UNPACK_METHODDEF
2270 {"pack", (PyCFunction)(void(*)(void))pack, METH_FASTCALL, pack_doc},
2271 {"pack_into", (PyCFunction)(void(*)(void))pack_into, METH_FASTCALL, pack_into_doc},
2272 UNPACK_METHODDEF
2273 UNPACK_FROM_METHODDEF
2274 {NULL, NULL} /* sentinel */
2275 };
2276
2277
2278 /* Module initialization */
2279
2280 PyDoc_STRVAR(module_doc,
2281 "Functions to convert between Python values and C structs.\n\
2282 Python bytes objects are used to hold the data representing the C struct\n\
2283 and also as format strings (explained below) to describe the layout of data\n\
2284 in the C struct.\n\
2285 \n\
2286 The optional first format char indicates byte order, size and alignment:\n\
2287 @: native order, size & alignment (default)\n\
2288 =: native order, std. size & alignment\n\
2289 <: little-endian, std. size & alignment\n\
2290 >: big-endian, std. size & alignment\n\
2291 !: same as >\n\
2292 \n\
2293 The remaining chars indicate types of args and must match exactly;\n\
2294 these can be preceded by a decimal repeat count:\n\
2295 x: pad byte (no data); c:char; b:signed byte; B:unsigned byte;\n\
2296 ?: _Bool (requires C99; if not available, char is used instead)\n\
2297 h:short; H:unsigned short; i:int; I:unsigned int;\n\
2298 l:long; L:unsigned long; f:float; d:double; e:half-float.\n\
2299 Special cases (preceding decimal count indicates length):\n\
2300 s:string (array of char); p: pascal string (with count byte).\n\
2301 Special cases (only available in native format):\n\
2302 n:ssize_t; N:size_t;\n\
2303 P:an integer type that is wide enough to hold a pointer.\n\
2304 Special case (not in native mode unless 'long long' in platform C):\n\
2305 q:long long; Q:unsigned long long\n\
2306 Whitespace between formats is ignored.\n\
2307 \n\
2308 The variable struct.error is an exception raised on errors.\n");
2309
2310
2311 static struct PyModuleDef _structmodule = {
2312 PyModuleDef_HEAD_INIT,
2313 "_struct",
2314 module_doc,
2315 -1,
2316 module_functions,
2317 NULL,
2318 NULL,
2319 NULL,
2320 NULL
2321 };
2322
2323 PyMODINIT_FUNC
PyInit__struct(void)2324 PyInit__struct(void)
2325 {
2326 PyObject *m;
2327
2328 m = PyModule_Create(&_structmodule);
2329 if (m == NULL)
2330 return NULL;
2331
2332 Py_TYPE(&PyStructType) = &PyType_Type;
2333 if (PyType_Ready(&PyStructType) < 0)
2334 return NULL;
2335
2336 if (PyType_Ready(&unpackiter_type) < 0)
2337 return NULL;
2338
2339 /* Check endian and swap in faster functions */
2340 {
2341 const formatdef *native = native_table;
2342 formatdef *other, *ptr;
2343 #if PY_LITTLE_ENDIAN
2344 other = lilendian_table;
2345 #else
2346 other = bigendian_table;
2347 #endif
2348 /* Scan through the native table, find a matching
2349 entry in the endian table and swap in the
2350 native implementations whenever possible
2351 (64-bit platforms may not have "standard" sizes) */
2352 while (native->format != '\0' && other->format != '\0') {
2353 ptr = other;
2354 while (ptr->format != '\0') {
2355 if (ptr->format == native->format) {
2356 /* Match faster when formats are
2357 listed in the same order */
2358 if (ptr == other)
2359 other++;
2360 /* Only use the trick if the
2361 size matches */
2362 if (ptr->size != native->size)
2363 break;
2364 /* Skip float and double, could be
2365 "unknown" float format */
2366 if (ptr->format == 'd' || ptr->format == 'f')
2367 break;
2368 ptr->pack = native->pack;
2369 ptr->unpack = native->unpack;
2370 break;
2371 }
2372 ptr++;
2373 }
2374 native++;
2375 }
2376 }
2377
2378 /* Add some symbolic constants to the module */
2379 if (StructError == NULL) {
2380 StructError = PyErr_NewException("struct.error", NULL, NULL);
2381 if (StructError == NULL)
2382 return NULL;
2383 }
2384
2385 Py_INCREF(StructError);
2386 PyModule_AddObject(m, "error", StructError);
2387
2388 Py_INCREF((PyObject*)&PyStructType);
2389 PyModule_AddObject(m, "Struct", (PyObject*)&PyStructType);
2390
2391 return m;
2392 }
2393