123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174 |
- /* Format bytes as hexadecimal */
- #include "Python.h"
- #include "pycore_strhex.h" // _Py_strhex_with_sep()
- #include <stdlib.h> // abs()
- static PyObject *_Py_strhex_impl(const char* argbuf, const Py_ssize_t arglen,
- PyObject* sep, int bytes_per_sep_group,
- const int return_bytes)
- {
- assert(arglen >= 0);
- Py_UCS1 sep_char = 0;
- if (sep) {
- Py_ssize_t seplen = PyObject_Length((PyObject*)sep);
- if (seplen < 0) {
- return NULL;
- }
- if (seplen != 1) {
- PyErr_SetString(PyExc_ValueError, "sep must be length 1.");
- return NULL;
- }
- if (PyUnicode_Check(sep)) {
- if (PyUnicode_READY(sep))
- return NULL;
- if (PyUnicode_KIND(sep) != PyUnicode_1BYTE_KIND) {
- PyErr_SetString(PyExc_ValueError, "sep must be ASCII.");
- return NULL;
- }
- sep_char = PyUnicode_READ_CHAR(sep, 0);
- }
- else if (PyBytes_Check(sep)) {
- sep_char = PyBytes_AS_STRING(sep)[0];
- }
- else {
- PyErr_SetString(PyExc_TypeError, "sep must be str or bytes.");
- return NULL;
- }
- if (sep_char > 127 && !return_bytes) {
- PyErr_SetString(PyExc_ValueError, "sep must be ASCII.");
- return NULL;
- }
- }
- else {
- bytes_per_sep_group = 0;
- }
- unsigned int abs_bytes_per_sep = abs(bytes_per_sep_group);
- Py_ssize_t resultlen = 0;
- if (bytes_per_sep_group && arglen > 0) {
- /* How many sep characters we'll be inserting. */
- resultlen = (arglen - 1) / abs_bytes_per_sep;
- }
- /* Bounds checking for our Py_ssize_t indices. */
- if (arglen >= PY_SSIZE_T_MAX / 2 - resultlen) {
- return PyErr_NoMemory();
- }
- resultlen += arglen * 2;
- if ((size_t)abs_bytes_per_sep >= (size_t)arglen) {
- bytes_per_sep_group = 0;
- abs_bytes_per_sep = 0;
- }
- PyObject *retval;
- Py_UCS1 *retbuf;
- if (return_bytes) {
- /* If _PyBytes_FromSize() were public we could avoid malloc+copy. */
- retval = PyBytes_FromStringAndSize(NULL, resultlen);
- if (!retval) {
- return NULL;
- }
- retbuf = (Py_UCS1 *)PyBytes_AS_STRING(retval);
- }
- else {
- retval = PyUnicode_New(resultlen, 127);
- if (!retval) {
- return NULL;
- }
- retbuf = PyUnicode_1BYTE_DATA(retval);
- }
- /* Hexlify */
- Py_ssize_t i, j;
- unsigned char c;
- if (bytes_per_sep_group == 0) {
- for (i = j = 0; i < arglen; ++i) {
- assert((j + 1) < resultlen);
- c = argbuf[i];
- retbuf[j++] = Py_hexdigits[c >> 4];
- retbuf[j++] = Py_hexdigits[c & 0x0f];
- }
- assert(j == resultlen);
- }
- else {
- /* The number of complete chunk+sep periods */
- Py_ssize_t chunks = (arglen - 1) / abs_bytes_per_sep;
- Py_ssize_t chunk;
- unsigned int k;
- if (bytes_per_sep_group < 0) {
- i = j = 0;
- for (chunk = 0; chunk < chunks; chunk++) {
- for (k = 0; k < abs_bytes_per_sep; k++) {
- c = argbuf[i++];
- retbuf[j++] = Py_hexdigits[c >> 4];
- retbuf[j++] = Py_hexdigits[c & 0x0f];
- }
- retbuf[j++] = sep_char;
- }
- while (i < arglen) {
- c = argbuf[i++];
- retbuf[j++] = Py_hexdigits[c >> 4];
- retbuf[j++] = Py_hexdigits[c & 0x0f];
- }
- assert(j == resultlen);
- }
- else {
- i = arglen - 1;
- j = resultlen - 1;
- for (chunk = 0; chunk < chunks; chunk++) {
- for (k = 0; k < abs_bytes_per_sep; k++) {
- c = argbuf[i--];
- retbuf[j--] = Py_hexdigits[c & 0x0f];
- retbuf[j--] = Py_hexdigits[c >> 4];
- }
- retbuf[j--] = sep_char;
- }
- while (i >= 0) {
- c = argbuf[i--];
- retbuf[j--] = Py_hexdigits[c & 0x0f];
- retbuf[j--] = Py_hexdigits[c >> 4];
- }
- assert(j == -1);
- }
- }
- #ifdef Py_DEBUG
- if (!return_bytes) {
- assert(_PyUnicode_CheckConsistency(retval, 1));
- }
- #endif
- return retval;
- }
- PyObject * _Py_strhex(const char* argbuf, const Py_ssize_t arglen)
- {
- return _Py_strhex_impl(argbuf, arglen, NULL, 0, 0);
- }
- /* Same as above but returns a bytes() instead of str() to avoid the
- * need to decode the str() when bytes are needed. */
- PyObject* _Py_strhex_bytes(const char* argbuf, const Py_ssize_t arglen)
- {
- return _Py_strhex_impl(argbuf, arglen, NULL, 0, 1);
- }
- /* These variants include support for a separator between every N bytes: */
- PyObject* _Py_strhex_with_sep(const char* argbuf, const Py_ssize_t arglen,
- PyObject* sep, const int bytes_per_group)
- {
- return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 0);
- }
- /* Same as above but returns a bytes() instead of str() to avoid the
- * need to decode the str() when bytes are needed. */
- PyObject* _Py_strhex_bytes_with_sep(const char* argbuf, const Py_ssize_t arglen,
- PyObject* sep, const int bytes_per_group)
- {
- return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 1);
- }
|