| /* bytes to hex implementation */ |
| |
| #include "Python.h" |
| |
| #include "pystrhex.h" |
| |
| static PyObject *_Py_strhex_impl(const char* argbuf, const Py_ssize_t arglen, |
| const PyObject* sep, int bytes_per_sep_group, |
| const int return_bytes) |
| { |
| assert(arglen >= 0); |
| |
| Py_UCS1 sep_char = 0; |
| if (sep) { |
| Py_ssize_t seplen = PyObject_Length((PyObject*)sep); |
| if (seplen < 0) { |
| return NULL; |
| } |
| if (seplen != 1) { |
| PyErr_SetString(PyExc_ValueError, "sep must be length 1."); |
| return NULL; |
| } |
| if (PyUnicode_Check(sep)) { |
| if (PyUnicode_READY(sep)) |
| return NULL; |
| if (PyUnicode_KIND(sep) != PyUnicode_1BYTE_KIND) { |
| PyErr_SetString(PyExc_ValueError, "sep must be ASCII."); |
| return NULL; |
| } |
| sep_char = PyUnicode_READ_CHAR(sep, 0); |
| } |
| else if (PyBytes_Check(sep)) { |
| sep_char = PyBytes_AS_STRING(sep)[0]; |
| } |
| else { |
| PyErr_SetString(PyExc_TypeError, "sep must be str or bytes."); |
| return NULL; |
| } |
| if (sep_char > 127 && !return_bytes) { |
| PyErr_SetString(PyExc_ValueError, "sep must be ASCII."); |
| return NULL; |
| } |
| } |
| else { |
| bytes_per_sep_group = 0; |
| } |
| |
| unsigned int abs_bytes_per_sep = abs(bytes_per_sep_group); |
| Py_ssize_t resultlen = 0; |
| if (bytes_per_sep_group && arglen > 0) { |
| /* How many sep characters we'll be inserting. */ |
| resultlen = (arglen - 1) / abs_bytes_per_sep; |
| } |
| /* Bounds checking for our Py_ssize_t indices. */ |
| if (arglen >= PY_SSIZE_T_MAX / 2 - resultlen) { |
| return PyErr_NoMemory(); |
| } |
| resultlen += arglen * 2; |
| |
| if ((size_t)abs_bytes_per_sep >= (size_t)arglen) { |
| bytes_per_sep_group = 0; |
| abs_bytes_per_sep = 0; |
| } |
| |
| PyObject *retval; |
| Py_UCS1 *retbuf; |
| if (return_bytes) { |
| /* If _PyBytes_FromSize() were public we could avoid malloc+copy. */ |
| retval = PyBytes_FromStringAndSize(NULL, resultlen); |
| if (!retval) { |
| return NULL; |
| } |
| retbuf = (Py_UCS1 *)PyBytes_AS_STRING(retval); |
| } |
| else { |
| retval = PyUnicode_New(resultlen, 127); |
| if (!retval) { |
| return NULL; |
| } |
| retbuf = PyUnicode_1BYTE_DATA(retval); |
| } |
| |
| /* Hexlify */ |
| Py_ssize_t i, j; |
| unsigned char c; |
| |
| if (bytes_per_sep_group == 0) { |
| for (i = j = 0; i < arglen; ++i) { |
| assert((j + 1) < resultlen); |
| c = argbuf[i]; |
| retbuf[j++] = Py_hexdigits[c >> 4]; |
| retbuf[j++] = Py_hexdigits[c & 0x0f]; |
| } |
| assert(j == resultlen); |
| } |
| else { |
| /* The number of complete chunk+sep periods */ |
| Py_ssize_t chunks = (arglen - 1) / abs_bytes_per_sep; |
| Py_ssize_t chunk; |
| unsigned int k; |
| |
| if (bytes_per_sep_group < 0) { |
| i = j = 0; |
| for (chunk = 0; chunk < chunks; chunk++) { |
| for (k = 0; k < abs_bytes_per_sep; k++) { |
| c = argbuf[i++]; |
| retbuf[j++] = Py_hexdigits[c >> 4]; |
| retbuf[j++] = Py_hexdigits[c & 0x0f]; |
| } |
| retbuf[j++] = sep_char; |
| } |
| while (i < arglen) { |
| c = argbuf[i++]; |
| retbuf[j++] = Py_hexdigits[c >> 4]; |
| retbuf[j++] = Py_hexdigits[c & 0x0f]; |
| } |
| assert(j == resultlen); |
| } |
| else { |
| i = arglen - 1; |
| j = resultlen - 1; |
| for (chunk = 0; chunk < chunks; chunk++) { |
| for (k = 0; k < abs_bytes_per_sep; k++) { |
| c = argbuf[i--]; |
| retbuf[j--] = Py_hexdigits[c & 0x0f]; |
| retbuf[j--] = Py_hexdigits[c >> 4]; |
| } |
| retbuf[j--] = sep_char; |
| } |
| while (i >= 0) { |
| c = argbuf[i--]; |
| retbuf[j--] = Py_hexdigits[c & 0x0f]; |
| retbuf[j--] = Py_hexdigits[c >> 4]; |
| } |
| assert(j == -1); |
| } |
| } |
| |
| #ifdef Py_DEBUG |
| if (!return_bytes) { |
| assert(_PyUnicode_CheckConsistency(retval, 1)); |
| } |
| #endif |
| |
| return retval; |
| } |
| |
| PyObject * _Py_strhex(const char* argbuf, const Py_ssize_t arglen) |
| { |
| return _Py_strhex_impl(argbuf, arglen, NULL, 0, 0); |
| } |
| |
| /* Same as above but returns a bytes() instead of str() to avoid the |
| * need to decode the str() when bytes are needed. */ |
| PyObject * _Py_strhex_bytes(const char* argbuf, const Py_ssize_t arglen) |
| { |
| return _Py_strhex_impl(argbuf, arglen, NULL, 0, 1); |
| } |
| |
| /* These variants include support for a separator between every N bytes: */ |
| |
| PyObject * _Py_strhex_with_sep(const char* argbuf, const Py_ssize_t arglen, const PyObject* sep, const int bytes_per_group) |
| { |
| return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 0); |
| } |
| |
| /* Same as above but returns a bytes() instead of str() to avoid the |
| * need to decode the str() when bytes are needed. */ |
| PyObject * _Py_strhex_bytes_with_sep(const char* argbuf, const Py_ssize_t arglen, const PyObject* sep, const int bytes_per_group) |
| { |
| return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 1); |
| } |