mirror of
				https://github.com/python/cpython.git
				synced 2025-10-26 19:24:34 +00:00 
			
		
		
		
	 772b2b09f2
			
		
	
	
		772b2b09f2
		
	
	
	
	
		
			
			Issue #25399: Don't create temporary bytes objects: modify _PyBytes_Format() to work directly on bytearray objects. * Rename _PyBytes_Format() to _PyBytes_FormatEx() just in case something outside CPython uses it * _PyBytes_FormatEx() now uses (char*, Py_ssize_t) for the input string, so bytearray_format() doesn't need to create a temporary input bytes object * Add use_bytearray parameter to _PyBytes_FormatEx() which is passed to _PyBytesWriter, to create a bytearray buffer instead of a bytes buffer. Most formatting operations are now between 2.5 and 5 times faster.
		
			
				
	
	
		
			197 lines
		
	
	
	
		
			7.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			197 lines
		
	
	
	
		
			7.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| 
 | |
| /* Bytes (String) object interface */
 | |
| 
 | |
| #ifndef Py_BYTESOBJECT_H
 | |
| #define Py_BYTESOBJECT_H
 | |
| #ifdef __cplusplus
 | |
| extern "C" {
 | |
| #endif
 | |
| 
 | |
| #include <stdarg.h>
 | |
| 
 | |
| /*
 | |
| Type PyBytesObject represents a character string.  An extra zero byte is
 | |
| reserved at the end to ensure it is zero-terminated, but a size is
 | |
| present so strings with null bytes in them can be represented.  This
 | |
| is an immutable object type.
 | |
| 
 | |
| There are functions to create new string objects, to test
 | |
| an object for string-ness, and to get the
 | |
| string value.  The latter function returns a null pointer
 | |
| if the object is not of the proper type.
 | |
| There is a variant that takes an explicit size as well as a
 | |
| variant that assumes a zero-terminated string.  Note that none of the
 | |
| functions should be applied to NULL pointers.
 | |
| */
 | |
| 
 | |
| /* Caching the hash (ob_shash) saves recalculation of a string's hash value.
 | |
|    This significantly speeds up dict lookups. */
 | |
| 
 | |
| #ifndef Py_LIMITED_API
 | |
| typedef struct {            /* bytes object layout; hidden when Py_LIMITED_API is defined */
 | |
|     PyObject_VAR_HEAD
 | |
|     Py_hash_t ob_shash;     /* cached hash, -1 until computed (see invariants) */
 | |
|     char ob_sval[1];        /* declared with one element; see invariants for the real extent */
 | |
| 
 | |
|     /* Invariants:
 | |
|      *     ob_sval contains space for 'ob_size+1' elements.
 | |
|      *     ob_sval[ob_size] == 0.
 | |
|      *     ob_shash is the hash of the string or -1 if not computed yet.
 | |
|      */
 | |
| } PyBytesObject;
 | |
| #endif
 | |
| 
 | |
| PyAPI_DATA(PyTypeObject) PyBytes_Type;      /* the type PyBytes_CheckExact() compares against */
 | |
| PyAPI_DATA(PyTypeObject) PyBytesIter_Type;  /* NOTE(review): presumably the type of bytes iterators - confirm */
 | |
| 
 | |
| #define PyBytes_Check(op) \
 | |
|                  PyType_FastSubclass(Py_TYPE(op), Py_TPFLAGS_BYTES_SUBCLASS)  /* flag-based test; presumably also true for subclasses - confirm */
 | |
| #define PyBytes_CheckExact(op) (Py_TYPE(op) == &PyBytes_Type)  /* true only when the type of op is exactly PyBytes_Type */
 | |
| 
 | |
| PyAPI_FUNC(PyObject *) PyBytes_FromStringAndSize(const char *, Py_ssize_t);  /* creation: variant taking an explicit size */
 | |
| PyAPI_FUNC(PyObject *) PyBytes_FromString(const char *);  /* creation: variant assuming a zero-terminated string */
 | |
| PyAPI_FUNC(PyObject *) PyBytes_FromObject(PyObject *);
 | |
| PyAPI_FUNC(PyObject *) PyBytes_FromFormatV(const char*, va_list)
 | |
| 				Py_GCC_ATTRIBUTE((format(printf, 1, 0)));  /* arg 1 is a printf-style format; 0 = no argument list to check (va_list) */
 | |
| PyAPI_FUNC(PyObject *) PyBytes_FromFormat(const char*, ...)
 | |
| 				Py_GCC_ATTRIBUTE((format(printf, 1, 2)));  /* arg 1 is a printf-style format; checked arguments start at arg 2 */
 | |
| PyAPI_FUNC(Py_ssize_t) PyBytes_Size(PyObject *);
 | |
| PyAPI_FUNC(char *) PyBytes_AsString(PyObject *);  /* per the comment at the top of this header: null pointer if the object has the wrong type */
 | |
| PyAPI_FUNC(PyObject *) PyBytes_Repr(PyObject *, int);
 | |
| PyAPI_FUNC(void) PyBytes_Concat(PyObject **, PyObject *);
 | |
| PyAPI_FUNC(void) PyBytes_ConcatAndDel(PyObject **, PyObject *);
 | |
| #ifndef Py_LIMITED_API
 | |
| PyAPI_FUNC(int) _PyBytes_Resize(PyObject **, Py_ssize_t);
 | |
| PyAPI_FUNC(PyObject*) _PyBytes_FormatEx(
 | |
|     const char *format,         /* input format string, given as pointer ... */
 | |
|     Py_ssize_t format_len,      /* ... plus explicit length, so no bytes object is needed for it */
 | |
|     PyObject *args,             /* NOTE(review): presumably the values to interpolate - confirm */
 | |
|     int use_bytearray);         /* non-zero: result is built in a bytearray buffer instead of a bytes buffer */
 | |
| #endif
 | |
| PyAPI_FUNC(PyObject *) PyBytes_DecodeEscape(const char *, Py_ssize_t,
 | |
| 						   const char *, Py_ssize_t,
 | |
| 						   const char *);  /* NOTE(review): parameters are unnamed here; take their meaning from the definition */
 | |
| 
 | |
| /* Macros, trading safety for speed: the only type check is an assert(),
 | |
|    and op appears more than once in each expansion, so it may be evaluated
 | |
|    more than once.  Hidden when Py_LIMITED_API is defined. */
 | |
| #ifndef Py_LIMITED_API
 | |
| #define PyBytes_AS_STRING(op) (assert(PyBytes_Check(op)), \
 | |
|                                 (((PyBytesObject *)(op))->ob_sval))  /* yields the ob_sval member directly */
 | |
| #define PyBytes_GET_SIZE(op)  (assert(PyBytes_Check(op)),Py_SIZE(op))  /* yields Py_SIZE(op) */
 | |
| #endif
 | |
| 
 | |
| /* _PyBytes_Join(sep, x) is like sep.join(x).  sep must be PyBytesObject*,
 | |
|    x must be an iterable object.  The declaration is hidden when
 | |
|    Py_LIMITED_API is defined. */
 | |
| #ifndef Py_LIMITED_API
 | |
| PyAPI_FUNC(PyObject *) _PyBytes_Join(PyObject *sep, PyObject *x);
 | |
| #endif
 | |
| 
 | |
| /* Provides access to the internal data buffer and size of a string
 | |
|    object or the default encoded version of a Unicode object. Passing
 | |
|    NULL as the len parameter will force the string buffer to be
 | |
|    0-terminated (passing a string with embedded null bytes will
 | |
|    cause an exception).
 | |
|    NOTE(review): the meaning of the int return value is not stated here;
 | |
|    presumably it signals success or failure - confirm in the definition. */
 | |
| PyAPI_FUNC(int) PyBytes_AsStringAndSize(
 | |
|     PyObject *obj,      /* string or Unicode object */
 | |
|     char **s,           /* pointer to buffer variable */
 | |
|     Py_ssize_t *len     /* pointer to length variable or NULL
 | |
|                            (only possible for 0-terminated
 | |
|                            strings) */
 | |
|     );
 | |
| 
 | |
| /* Using the current locale, insert the thousands grouping
 | |
|    into the string pointed to by buffer.  For the argument descriptions,
 | |
|    see Objects/stringlib/localeutil.h.
 | |
|    Both functions in this group are hidden when Py_LIMITED_API is defined. */
 | |
| #ifndef Py_LIMITED_API
 | |
| PyAPI_FUNC(Py_ssize_t) _PyBytes_InsertThousandsGroupingLocale(char *buffer,
 | |
|                                                    Py_ssize_t n_buffer,
 | |
|                                                    char *digits,
 | |
|                                                    Py_ssize_t n_digits,
 | |
|                                                    Py_ssize_t min_width);
 | |
| 
 | |
| /* Using explicit passed-in values, insert the thousands grouping
 | |
|    into the string pointed to by buffer.  For the argument descriptions,
 | |
|    see Objects/stringlib/localeutil.h.
 | |
|    The signature matches the Locale variant above, plus the explicit
 | |
|    grouping and thousands_sep arguments. */
 | |
| PyAPI_FUNC(Py_ssize_t) _PyBytes_InsertThousandsGrouping(char *buffer,
 | |
|                                                    Py_ssize_t n_buffer,
 | |
|                                                    char *digits,
 | |
|                                                    Py_ssize_t n_digits,
 | |
|                                                    Py_ssize_t min_width,
 | |
|                                                    const char *grouping,
 | |
|                                                    const char *thousands_sep);
 | |
| #endif
 | |
| 
 | |
| /* Flags used by string formatting.  Each flag is a distinct bit, so the
 | |
|    values can be combined with bitwise OR.  They are defined unconditionally
 | |
|    (not guarded by Py_LIMITED_API) and carry no Py prefix.
 | |
|    NOTE(review): the names suggest the printf-style '-', '+', ' ', '#' and
 | |
|    '0' flags - confirm against the formatting code. */
 | |
| #define F_LJUST (1<<0)
 | |
| #define F_SIGN	(1<<1)
 | |
| #define F_BLANK (1<<2)
 | |
| #define F_ALT	(1<<3)
 | |
| #define F_ZERO	(1<<4)
 | |
| 
 | |
| #ifndef Py_LIMITED_API
 | |
| /* The _PyBytesWriter structure is big: it contains an embedded "stack buffer".
 | |
|    A _PyBytesWriter variable must be declared at the end of variables in a
 | |
|    function to optimize the memory allocation on the stack. */
 | |
| typedef struct {
 | |
|     /* bytes, bytearray or NULL (when the small buffer is used) */
 | |
|     PyObject *buffer;
 | |
| 
 | |
|     /* Allocated size of the buffer. */
 | |
|     Py_ssize_t allocated;
 | |
| 
 | |
|     /* Minimum number of allocated bytes,
 | |
|        incremented by _PyBytesWriter_Prepare() */
 | |
|     Py_ssize_t min_size;
 | |
| 
 | |
|     /* If non-zero, use a bytearray instead of a bytes object for buffer. */
 | |
|     int use_bytearray;
 | |
| 
 | |
|     /* If non-zero, overallocate the buffer (default: 0).
 | |
|        This flag must be zero if use_bytearray is non-zero. */
 | |
|     int overallocate;
 | |
| 
 | |
|     /* Stack buffer: small_buffer is embedded in the structure itself.
 | |
|        NOTE(review): use_small_buffer is presumably non-zero while
 | |
|        small_buffer holds the data (buffer is then NULL) - confirm. */
 | |
|     int use_small_buffer;
 | |
|     char small_buffer[512];
 | |
| } _PyBytesWriter;
 | |
| 
 | |
| /* Initialize a bytes writer.
 | |
| 
 | |
|    By default, the overallocation is disabled. Set the overallocate field
 | |
|    of the writer to control the allocation of the buffer. */
 | |
| PyAPI_FUNC(void) _PyBytesWriter_Init(_PyBytesWriter *writer);
 | |
| 
 | |
| /* Get the buffer content and reset the writer.
 | |
|    Return a bytes object, or a bytearray object if use_bytearray is non-zero.
 | |
|    Raise an exception and return NULL on error.
 | |
|    NOTE(review): str is presumably the current pointer inside the buffer,
 | |
|    i.e. the end of the data written so far - confirm in the definition. */
 | |
| PyAPI_FUNC(PyObject *) _PyBytesWriter_Finish(_PyBytesWriter *writer,
 | |
|     void *str);
 | |
| 
 | |
| /* Deallocate memory of a writer (clear its internal buffer). */
 | |
| PyAPI_FUNC(void) _PyBytesWriter_Dealloc(_PyBytesWriter *writer);
 | |
| 
 | |
| /* Allocate the buffer to write size bytes.
 | |
|    Return the pointer to the beginning of buffer data.
 | |
|    Raise an exception and return NULL on error.
 | |
|    NOTE(review): the returned pointer is presumably the initial str value
 | |
|    to pass to the other writer functions - confirm. */
 | |
| PyAPI_FUNC(void*) _PyBytesWriter_Alloc(_PyBytesWriter *writer,
 | |
|     Py_ssize_t size);
 | |
| 
 | |
| /* Add *size* bytes to the buffer.
 | |
|    str is the current pointer inside the buffer.
 | |
|    Return the updated current pointer inside the buffer.
 | |
|    Raise an exception and return NULL on error.
 | |
|    This call also increments the min_size field of the writer (see the
 | |
|    comment on that field in _PyBytesWriter). */
 | |
| PyAPI_FUNC(void*) _PyBytesWriter_Prepare(_PyBytesWriter *writer,
 | |
|     void *str,
 | |
|     Py_ssize_t size);
 | |
| 
 | |
| /* Write bytes.
 | |
|    Raise an exception and return NULL on error.
 | |
|    NOTE(review): by analogy with _PyBytesWriter_Prepare(), str is presumably
 | |
|    the current pointer inside the buffer, bytes/size the data to copy, and
 | |
|    the return value the updated pointer - confirm in the definition. */
 | |
| PyAPI_FUNC(void*) _PyBytesWriter_WriteBytes(_PyBytesWriter *writer,
 | |
|     void *str,
 | |
|     const void *bytes,
 | |
|     Py_ssize_t size);
 | |
| #endif   /* Py_LIMITED_API */
 | |
| 
 | |
| #ifdef __cplusplus
 | |
| }
 | |
| #endif
 | |
| #endif /* !Py_BYTESOBJECT_H */
 |