Objects/stringlib/transmogrify.h - platform/external/python/cpython3 - Gitiles

 /* NOTE: this API is -ONLY- for use with single byte character strings. */
 /* Do not use it with Unicode. */

 #include "bytes_methods.h"

 #ifndef STRINGLIB_MUTABLE
 #warning "STRINGLIB_MUTABLE not defined before #include, assuming 0"
 #define STRINGLIB_MUTABLE 0
 #endif

 /* the more complicated methods.  parts of these should be pulled out into the
    shared code in bytes_methods.c to cut down on duplicate code bloat.  */

 PyDoc_STRVAR(expandtabs__doc__,
 "B.expandtabs([tabsize]) -> copy of B\n\
 \n\
 Return a copy of B where all tab characters are expanded using spaces.\n\
 If tabsize is not given, a tab size of 8 characters is assumed.");

 static PyObject*
 stringlib_expandtabs(PyObject *self, PyObject *args)
 {
     const char *e, *p;
     char *q;
     size_t i, j;
     PyObject *u;
     int tabsize = 8;

     if (!PyArg_ParseTuple(args, "|i:expandtabs", &tabsize))
         return NULL;

     /* First pass: determine size of output string */
     i = j = 0;
     e = STRINGLIB_STR(self) + STRINGLIB_LEN(self);
     for (p = STRINGLIB_STR(self); p < e; p++)
         if (*p == '\t') {
             if (tabsize > 0) {
                 j += tabsize - (j % tabsize);
                 if (j > PY_SSIZE_T_MAX) {
                     PyErr_SetString(PyExc_OverflowError,
                                     "result is too long");
                     return NULL;
                 }
             }
         }
         else {
             j++;
             if (*p == '\n' || *p == '\r') {
                 i += j;
                 j = 0;
                 if (i > PY_SSIZE_T_MAX) {
                     PyErr_SetString(PyExc_OverflowError,
                                     "result is too long");
                     return NULL;
                 }
             }
         }

     if ((i + j) > PY_SSIZE_T_MAX) {
         PyErr_SetString(PyExc_OverflowError, "result is too long");
         return NULL;
     }

     /* Second pass: create output string and fill it */
     u = STRINGLIB_NEW(NULL, i + j);
     if (!u)
         return NULL;

     j = 0;
     q = STRINGLIB_STR(u);

     for (p = STRINGLIB_STR(self); p < e; p++)
         if (*p == '\t') {
             if (tabsize > 0) {
                 i = tabsize - (j % tabsize);
                 j += i;
                 while (i--)
                     *q++ = ' ';
             }
         }
         else {
             j++;
             *q++ = *p;
             if (*p == '\n' || *p == '\r')
                 j = 0;
         }

     return u;
 }

 Py_LOCAL_INLINE(PyObject *)
 pad(PyObject *self, Py_ssize_t left, Py_ssize_t right, char fill)
 {
     PyObject *u;

     if (left < 0)
         left = 0;
     if (right < 0)
         right = 0;

     if (left == 0 && right == 0 && STRINGLIB_CHECK_EXACT(self)) {
 #if STRINGLIB_MUTABLE
         /* We're defined as returning a copy;  If the object is mutable
          * that means we must make an identical copy. */
         return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
 #else
         Py_INCREF(self);
         return (PyObject *)self;
 #endif /* STRINGLIB_MUTABLE */
     }

     u = STRINGLIB_NEW(NULL,
                                    left + STRINGLIB_LEN(self) + right);
     if (u) {
         if (left)
             memset(STRINGLIB_STR(u), fill, left);
         Py_MEMCPY(STRINGLIB_STR(u) + left,
                STRINGLIB_STR(self),
                STRINGLIB_LEN(self));
         if (right)
             memset(STRINGLIB_STR(u) + left + STRINGLIB_LEN(self),
                    fill, right);
     }

     return u;
 }

 PyDoc_STRVAR(ljust__doc__,
 "B.ljust(width[, fillchar]) -> copy of B\n"
 "\n"
 "Return B left justified in a string of length width. Padding is\n"
 "done using the specified fill character (default is a space).");

 static PyObject *
 stringlib_ljust(PyObject *self, PyObject *args)
 {
     Py_ssize_t width;
     char fillchar = ' ';

     if (!PyArg_ParseTuple(args, "n|c:ljust", &width, &fillchar))
         return NULL;

     if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
 #if STRINGLIB_MUTABLE
         /* We're defined as returning a copy;  If the object is mutable
          * that means we must make an identical copy. */
         return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
 #else
         Py_INCREF(self);
         return (PyObject*) self;
 #endif
     }

     return pad(self, 0, width - STRINGLIB_LEN(self), fillchar);
 }


 PyDoc_STRVAR(rjust__doc__,
 "B.rjust(width[, fillchar]) -> copy of B\n"
 "\n"
 "Return B right justified in a string of length width. Padding is\n"
 "done using the specified fill character (default is a space)");

 static PyObject *
 stringlib_rjust(PyObject *self, PyObject *args)
 {
     Py_ssize_t width;
     char fillchar = ' ';

     if (!PyArg_ParseTuple(args, "n|c:rjust", &width, &fillchar))
         return NULL;

     if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
 #if STRINGLIB_MUTABLE
         /* We're defined as returning a copy;  If the object is mutable
          * that means we must make an identical copy. */
         return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
 #else
         Py_INCREF(self);
         return (PyObject*) self;
 #endif
     }

     return pad(self, width - STRINGLIB_LEN(self), 0, fillchar);
 }


 PyDoc_STRVAR(center__doc__,
 "B.center(width[, fillchar]) -> copy of B\n"
 "\n"
 "Return B centered in a string of length width.  Padding is\n"
 "done using the specified fill character (default is a space).");

 static PyObject *
 stringlib_center(PyObject *self, PyObject *args)
 {
     Py_ssize_t marg, left;
     Py_ssize_t width;
     char fillchar = ' ';

     if (!PyArg_ParseTuple(args, "n|c:center", &width, &fillchar))
         return NULL;

     if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
 #if STRINGLIB_MUTABLE
         /* We're defined as returning a copy;  If the object is mutable
          * that means we must make an identical copy. */
         return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
 #else
         Py_INCREF(self);
         return (PyObject*) self;
 #endif
     }

     marg = width - STRINGLIB_LEN(self);
     left = marg / 2 + (marg & width & 1);

     return pad(self, left, marg - left, fillchar);
 }

 PyDoc_STRVAR(zfill__doc__,
 "B.zfill(width) -> copy of B\n"
 "\n"
 "Pad a numeric string B with zeros on the left, to fill a field\n"
 "of the specified width.  B is never truncated.");

 static PyObject *
 stringlib_zfill(PyObject *self, PyObject *args)
 {
     Py_ssize_t fill;
     PyObject *s;
     char *p;
     Py_ssize_t width;

     if (!PyArg_ParseTuple(args, "n:zfill", &width))
         return NULL;

     if (STRINGLIB_LEN(self) >= width) {
         if (STRINGLIB_CHECK_EXACT(self)) {
 #if STRINGLIB_MUTABLE
             /* We're defined as returning a copy;  If the object is mutable
              * that means we must make an identical copy. */
             return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
 #else
             Py_INCREF(self);
             return (PyObject*) self;
 #endif
         }
         else
             return STRINGLIB_NEW(
                 STRINGLIB_STR(self),
                 STRINGLIB_LEN(self)
             );
     }

     fill = width - STRINGLIB_LEN(self);

     s = pad(self, fill, 0, '0');

     if (s == NULL)
         return NULL;

     p = STRINGLIB_STR(s);
     if (p[fill] == '+' || p[fill] == '-') {
         /* move sign to beginning of string */
         p[0] = p[fill];
         p[fill] = '0';
     }

     return (PyObject*) s;
 }


 #define _STRINGLIB_SPLIT_APPEND(data, left, right)              \
         str = STRINGLIB_NEW((data) + (left),                    \
                                          (right) - (left));     \
         if (str == NULL)                                        \
                 goto onError;                                   \
         if (PyList_Append(list, str)) {                         \
                 Py_DECREF(str);                                 \
                 goto onError;                                   \
         }                                                       \
         else                                                    \
                 Py_DECREF(str);

 PyDoc_STRVAR(splitlines__doc__,
 "B.splitlines([keepends]) -> list of lines\n\
 \n\
 Return a list of the lines in B, breaking at line boundaries.\n\
 Line breaks are not included in the resulting list unless keepends\n\
 is given and true.");

 static PyObject*
 stringlib_splitlines(PyObject *self, PyObject *args)
 {
     register Py_ssize_t i;
     register Py_ssize_t j;
     Py_ssize_t len;
     int keepends = 0;
     PyObject *list;
     PyObject *str;
     char *data;

     if (!PyArg_ParseTuple(args, "|i:splitlines", &keepends))
         return NULL;

     data = STRINGLIB_STR(self);
     len = STRINGLIB_LEN(self);

     /* This does not use the preallocated list because splitlines is
        usually run with hundreds of newlines.  The overhead of
        switching between PyList_SET_ITEM and append causes about a
        2-3% slowdown for that common case.  A smarter implementation
        could move the if check out, so the SET_ITEMs are done first
        and the appends only done when the prealloc buffer is full.
        That's too much work for little gain.*/

     list = PyList_New(0);
     if (!list)
         goto onError;

     for (i = j = 0; i < len; ) {
         Py_ssize_t eol;

         /* Find a line and append it */
         while (i < len && data[i] != '\n' && data[i] != '\r')
             i++;

         /* Skip the line break reading CRLF as one line break */
         eol = i;
         if (i < len) {
             if (data[i] == '\r' && i + 1 < len &&
                 data[i+1] == '\n')
                 i += 2;
             else
                 i++;
             if (keepends)
                 eol = i;
         }
         _STRINGLIB_SPLIT_APPEND(data, j, eol);
         j = i;
     }
     if (j < len) {
         _STRINGLIB_SPLIT_APPEND(data, j, len);
     }

     return list;

  onError:
     Py_XDECREF(list);
     return NULL;
 }

 #undef _STRINGLIB_SPLIT_APPEND
	/* NOTE: this API is -ONLY- for use with single byte character strings. */
	/* Do not use it with Unicode. */

	#include "bytes_methods.h"

	#ifndef STRINGLIB_MUTABLE
	#warning "STRINGLIB_MUTABLE not defined before #include, assuming 0"
	#define STRINGLIB_MUTABLE 0
	#endif

	/* the more complicated methods. parts of these should be pulled out into the
	shared code in bytes_methods.c to cut down on duplicate code bloat. */

	PyDoc_STRVAR(expandtabs__doc__,
	"B.expandtabs([tabsize]) -> copy of B\n\
	\n\
	Return a copy of B where all tab characters are expanded using spaces.\n\
	If tabsize is not given, a tab size of 8 characters is assumed.");

	static PyObject*
	stringlib_expandtabs(PyObject self, PyObject args)
	{
	const char e, p;
	char *q;
	size_t i, j;
	PyObject *u;
	int tabsize = 8;

	if (!PyArg_ParseTuple(args, "\|i:expandtabs", &tabsize))
	return NULL;

	/* First pass: determine size of output string */
	i = j = 0;
	e = STRINGLIB_STR(self) + STRINGLIB_LEN(self);
	for (p = STRINGLIB_STR(self); p < e; p++)
	if (*p == '\t') {
	if (tabsize > 0) {
	j += tabsize - (j % tabsize);
	if (j > PY_SSIZE_T_MAX) {
	PyErr_SetString(PyExc_OverflowError,
	"result is too long");
	return NULL;
	}
	}
	}
	else {
	j++;
	if (p == '\n' \|\| p == '\r') {
	i += j;
	j = 0;
	if (i > PY_SSIZE_T_MAX) {
	PyErr_SetString(PyExc_OverflowError,
	"result is too long");
	return NULL;
	}
	}
	}

	if ((i + j) > PY_SSIZE_T_MAX) {
	PyErr_SetString(PyExc_OverflowError, "result is too long");
	return NULL;
	}

	/* Second pass: create output string and fill it */
	u = STRINGLIB_NEW(NULL, i + j);
	if (!u)
	return NULL;

	j = 0;
	q = STRINGLIB_STR(u);

	for (p = STRINGLIB_STR(self); p < e; p++)
	if (*p == '\t') {
	if (tabsize > 0) {
	i = tabsize - (j % tabsize);
	j += i;
	while (i--)
	*q++ = ' ';
	}
	}
	else {
	j++;
	q++ = p;
	if (p == '\n' \|\| p == '\r')
	j = 0;
	}

	return u;
	}

	Py_LOCAL_INLINE(PyObject *)
	pad(PyObject *self, Py_ssize_t left, Py_ssize_t right, char fill)
	{
	PyObject *u;

	if (left < 0)
	left = 0;
	if (right < 0)
	right = 0;

	if (left == 0 && right == 0 && STRINGLIB_CHECK_EXACT(self)) {
	#if STRINGLIB_MUTABLE
	/* We're defined as returning a copy; If the object is mutable
	* that means we must make an identical copy. */
	return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
	#else
	Py_INCREF(self);
	return (PyObject *)self;
	#endif /* STRINGLIB_MUTABLE */
	}

	u = STRINGLIB_NEW(NULL,
	left + STRINGLIB_LEN(self) + right);
	if (u) {
	if (left)
	memset(STRINGLIB_STR(u), fill, left);
	Py_MEMCPY(STRINGLIB_STR(u) + left,
	STRINGLIB_STR(self),
	STRINGLIB_LEN(self));
	if (right)
	memset(STRINGLIB_STR(u) + left + STRINGLIB_LEN(self),
	fill, right);
	}

	return u;
	}

	PyDoc_STRVAR(ljust__doc__,
	"B.ljust(width[, fillchar]) -> copy of B\n"
	"\n"
	"Return B left justified in a string of length width. Padding is\n"
	"done using the specified fill character (default is a space).");

	static PyObject *
	stringlib_ljust(PyObject self, PyObject args)
	{
	Py_ssize_t width;
	char fillchar = ' ';

	if (!PyArg_ParseTuple(args, "n\|c:ljust", &width, &fillchar))
	return NULL;

	if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
	#if STRINGLIB_MUTABLE
	/* We're defined as returning a copy; If the object is mutable
	* that means we must make an identical copy. */
	return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
	#else
	Py_INCREF(self);
	return (PyObject*) self;
	#endif
	}

	return pad(self, 0, width - STRINGLIB_LEN(self), fillchar);
	}


	PyDoc_STRVAR(rjust__doc__,
	"B.rjust(width[, fillchar]) -> copy of B\n"
	"\n"
	"Return B right justified in a string of length width. Padding is\n"
	"done using the specified fill character (default is a space)");

	static PyObject *
	stringlib_rjust(PyObject self, PyObject args)
	{
	Py_ssize_t width;
	char fillchar = ' ';

	if (!PyArg_ParseTuple(args, "n\|c:rjust", &width, &fillchar))
	return NULL;

	if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
	#if STRINGLIB_MUTABLE
	/* We're defined as returning a copy; If the object is mutable
	* that means we must make an identical copy. */
	return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
	#else
	Py_INCREF(self);
	return (PyObject*) self;
	#endif
	}

	return pad(self, width - STRINGLIB_LEN(self), 0, fillchar);
	}


	PyDoc_STRVAR(center__doc__,
	"B.center(width[, fillchar]) -> copy of B\n"
	"\n"
	"Return B centered in a string of length width. Padding is\n"
	"done using the specified fill character (default is a space).");

	static PyObject *
	stringlib_center(PyObject self, PyObject args)
	{
	Py_ssize_t marg, left;
	Py_ssize_t width;
	char fillchar = ' ';

	if (!PyArg_ParseTuple(args, "n\|c:center", &width, &fillchar))
	return NULL;

	if (STRINGLIB_LEN(self) >= width && STRINGLIB_CHECK_EXACT(self)) {
	#if STRINGLIB_MUTABLE
	/* We're defined as returning a copy; If the object is mutable
	* that means we must make an identical copy. */
	return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
	#else
	Py_INCREF(self);
	return (PyObject*) self;
	#endif
	}

	marg = width - STRINGLIB_LEN(self);
	left = marg / 2 + (marg & width & 1);

	return pad(self, left, marg - left, fillchar);
	}

	PyDoc_STRVAR(zfill__doc__,
	"B.zfill(width) -> copy of B\n"
	"\n"
	"Pad a numeric string B with zeros on the left, to fill a field\n"
	"of the specified width. B is never truncated.");

	static PyObject *
	stringlib_zfill(PyObject self, PyObject args)
	{
	Py_ssize_t fill;
	PyObject *s;
	char *p;
	Py_ssize_t width;

	if (!PyArg_ParseTuple(args, "n:zfill", &width))
	return NULL;

	if (STRINGLIB_LEN(self) >= width) {
	if (STRINGLIB_CHECK_EXACT(self)) {
	#if STRINGLIB_MUTABLE
	/* We're defined as returning a copy; If the object is mutable
	* that means we must make an identical copy. */
	return STRINGLIB_NEW(STRINGLIB_STR(self), STRINGLIB_LEN(self));
	#else
	Py_INCREF(self);
	return (PyObject*) self;
	#endif
	}
	else
	return STRINGLIB_NEW(
	STRINGLIB_STR(self),
	STRINGLIB_LEN(self)
	);
	}

	fill = width - STRINGLIB_LEN(self);

	s = pad(self, fill, 0, '0');

	if (s == NULL)
	return NULL;

	p = STRINGLIB_STR(s);
	if (p[fill] == '+' \|\| p[fill] == '-') {
	/* move sign to beginning of string */
	p[0] = p[fill];
	p[fill] = '0';
	}

	return (PyObject*) s;
	}


	#define _STRINGLIB_SPLIT_APPEND(data, left, right) \
	str = STRINGLIB_NEW((data) + (left), \
	(right) - (left)); \
	if (str == NULL) \
	goto onError; \
	if (PyList_Append(list, str)) { \
	Py_DECREF(str); \
	goto onError; \
	} \
	else \
	Py_DECREF(str);

	PyDoc_STRVAR(splitlines__doc__,
	"B.splitlines([keepends]) -> list of lines\n\
	\n\
	Return a list of the lines in B, breaking at line boundaries.\n\
	Line breaks are not included in the resulting list unless keepends\n\
	is given and true.");

	static PyObject*
	stringlib_splitlines(PyObject self, PyObject args)
	{
	register Py_ssize_t i;
	register Py_ssize_t j;
	Py_ssize_t len;
	int keepends = 0;
	PyObject *list;
	PyObject *str;
	char *data;

	if (!PyArg_ParseTuple(args, "\|i:splitlines", &keepends))
	return NULL;

	data = STRINGLIB_STR(self);
	len = STRINGLIB_LEN(self);

	/* This does not use the preallocated list because splitlines is
	usually run with hundreds of newlines. The overhead of
	switching between PyList_SET_ITEM and append causes about a
	2-3% slowdown for that common case. A smarter implementation
	could move the if check out, so the SET_ITEMs are done first
	and the appends only done when the prealloc buffer is full.
	That's too much work for little gain.*/

	list = PyList_New(0);
	if (!list)
	goto onError;

	for (i = j = 0; i < len; ) {
	Py_ssize_t eol;

	/* Find a line and append it */
	while (i < len && data[i] != '\n' && data[i] != '\r')
	i++;

	/* Skip the line break reading CRLF as one line break */
	eol = i;
	if (i < len) {
	if (data[i] == '\r' && i + 1 < len &&
	data[i+1] == '\n')
	i += 2;
	else
	i++;
	if (keepends)
	eol = i;
	}
	_STRINGLIB_SPLIT_APPEND(data, j, eol);
	j = i;
	}
	if (j < len) {
	_STRINGLIB_SPLIT_APPEND(data, j, len);
	}

	return list;

	onError:
	Py_XDECREF(list);
	return NULL;
	}

	#undef _STRINGLIB_SPLIT_APPEND