mirror of
				https://github.com/python/cpython.git
				synced 2025-10-24 15:36:26 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			172 lines
		
	
	
	
		
			5.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			172 lines
		
	
	
	
		
			5.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* Format bytes as hexadecimal */
 | |
| 
 | |
| #include "Python.h"
 | |
| #include "pycore_strhex.h"        // _Py_strhex_with_sep()
 | |
| #include "pycore_unicodeobject.h" // _PyUnicode_CheckConsistency()
 | |
| 
 | |
| static PyObject *_Py_strhex_impl(const char* argbuf, const Py_ssize_t arglen,
 | |
|                                  PyObject* sep, int bytes_per_sep_group,
 | |
|                                  const int return_bytes)
 | |
| {
 | |
|     assert(arglen >= 0);
 | |
| 
 | |
|     Py_UCS1 sep_char = 0;
 | |
|     if (sep) {
 | |
|         Py_ssize_t seplen = PyObject_Length((PyObject*)sep);
 | |
|         if (seplen < 0) {
 | |
|             return NULL;
 | |
|         }
 | |
|         if (seplen != 1) {
 | |
|             PyErr_SetString(PyExc_ValueError, "sep must be length 1.");
 | |
|             return NULL;
 | |
|         }
 | |
|         if (PyUnicode_Check(sep)) {
 | |
|             if (PyUnicode_KIND(sep) != PyUnicode_1BYTE_KIND) {
 | |
|                 PyErr_SetString(PyExc_ValueError, "sep must be ASCII.");
 | |
|                 return NULL;
 | |
|             }
 | |
|             sep_char = PyUnicode_READ_CHAR(sep, 0);
 | |
|         }
 | |
|         else if (PyBytes_Check(sep)) {
 | |
|             sep_char = PyBytes_AS_STRING(sep)[0];
 | |
|         }
 | |
|         else {
 | |
|             PyErr_SetString(PyExc_TypeError, "sep must be str or bytes.");
 | |
|             return NULL;
 | |
|         }
 | |
|         if (sep_char > 127 && !return_bytes) {
 | |
|             PyErr_SetString(PyExc_ValueError, "sep must be ASCII.");
 | |
|             return NULL;
 | |
|         }
 | |
|     }
 | |
|     else {
 | |
|         bytes_per_sep_group = 0;
 | |
|     }
 | |
| 
 | |
|     unsigned int abs_bytes_per_sep = Py_ABS(bytes_per_sep_group);
 | |
|     Py_ssize_t resultlen = 0;
 | |
|     if (bytes_per_sep_group && arglen > 0) {
 | |
|         /* How many sep characters we'll be inserting. */
 | |
|         resultlen = (arglen - 1) / abs_bytes_per_sep;
 | |
|     }
 | |
|     /* Bounds checking for our Py_ssize_t indices. */
 | |
|     if (arglen >= PY_SSIZE_T_MAX / 2 - resultlen) {
 | |
|         return PyErr_NoMemory();
 | |
|     }
 | |
|     resultlen += arglen * 2;
 | |
| 
 | |
|     if ((size_t)abs_bytes_per_sep >= (size_t)arglen) {
 | |
|         bytes_per_sep_group = 0;
 | |
|         abs_bytes_per_sep = 0;
 | |
|     }
 | |
| 
 | |
|     PyObject *retval;
 | |
|     Py_UCS1 *retbuf;
 | |
|     if (return_bytes) {
 | |
|         /* If _PyBytes_FromSize() were public we could avoid malloc+copy. */
 | |
|         retval = PyBytes_FromStringAndSize(NULL, resultlen);
 | |
|         if (!retval) {
 | |
|             return NULL;
 | |
|         }
 | |
|         retbuf = (Py_UCS1 *)PyBytes_AS_STRING(retval);
 | |
|     }
 | |
|     else {
 | |
|         retval = PyUnicode_New(resultlen, 127);
 | |
|         if (!retval) {
 | |
|             return NULL;
 | |
|         }
 | |
|         retbuf = PyUnicode_1BYTE_DATA(retval);
 | |
|     }
 | |
| 
 | |
|     /* Hexlify */
 | |
|     Py_ssize_t i, j;
 | |
|     unsigned char c;
 | |
| 
 | |
|     if (bytes_per_sep_group == 0) {
 | |
|         for (i = j = 0; i < arglen; ++i) {
 | |
|             assert((j + 1) < resultlen);
 | |
|             c = argbuf[i];
 | |
|             retbuf[j++] = Py_hexdigits[c >> 4];
 | |
|             retbuf[j++] = Py_hexdigits[c & 0x0f];
 | |
|         }
 | |
|         assert(j == resultlen);
 | |
|     }
 | |
|     else {
 | |
|         /* The number of complete chunk+sep periods */
 | |
|         Py_ssize_t chunks = (arglen - 1) / abs_bytes_per_sep;
 | |
|         Py_ssize_t chunk;
 | |
|         unsigned int k;
 | |
| 
 | |
|         if (bytes_per_sep_group < 0) {
 | |
|             i = j = 0;
 | |
|             for (chunk = 0; chunk < chunks; chunk++) {
 | |
|                 for (k = 0; k < abs_bytes_per_sep; k++) {
 | |
|                     c = argbuf[i++];
 | |
|                     retbuf[j++] = Py_hexdigits[c >> 4];
 | |
|                     retbuf[j++] = Py_hexdigits[c & 0x0f];
 | |
|                 }
 | |
|                 retbuf[j++] = sep_char;
 | |
|             }
 | |
|             while (i < arglen) {
 | |
|                 c = argbuf[i++];
 | |
|                 retbuf[j++] = Py_hexdigits[c >> 4];
 | |
|                 retbuf[j++] = Py_hexdigits[c & 0x0f];
 | |
|             }
 | |
|             assert(j == resultlen);
 | |
|         }
 | |
|         else {
 | |
|             i = arglen - 1;
 | |
|             j = resultlen - 1;
 | |
|             for (chunk = 0; chunk < chunks; chunk++) {
 | |
|                 for (k = 0; k < abs_bytes_per_sep; k++) {
 | |
|                     c = argbuf[i--];
 | |
|                     retbuf[j--] = Py_hexdigits[c & 0x0f];
 | |
|                     retbuf[j--] = Py_hexdigits[c >> 4];
 | |
|                 }
 | |
|                 retbuf[j--] = sep_char;
 | |
|             }
 | |
|             while (i >= 0) {
 | |
|                 c = argbuf[i--];
 | |
|                 retbuf[j--] = Py_hexdigits[c & 0x0f];
 | |
|                 retbuf[j--] = Py_hexdigits[c >> 4];
 | |
|             }
 | |
|             assert(j == -1);
 | |
|         }
 | |
|     }
 | |
| 
 | |
| #ifdef Py_DEBUG
 | |
|     if (!return_bytes) {
 | |
|         assert(_PyUnicode_CheckConsistency(retval, 1));
 | |
|     }
 | |
| #endif
 | |
| 
 | |
|     return retval;
 | |
| }
 | |
| 
 | |
| PyObject * _Py_strhex(const char* argbuf, const Py_ssize_t arglen)
 | |
| {
 | |
|     return _Py_strhex_impl(argbuf, arglen, NULL, 0, 0);
 | |
| }
 | |
| 
 | |
| /* Same as above but returns a bytes() instead of str() to avoid the
 | |
|  * need to decode the str() when bytes are needed. */
 | |
| PyObject* _Py_strhex_bytes(const char* argbuf, const Py_ssize_t arglen)
 | |
| {
 | |
|     return _Py_strhex_impl(argbuf, arglen, NULL, 0, 1);
 | |
| }
 | |
| 
 | |
| /* These variants include support for a separator between every N bytes: */
 | |
| 
 | |
| PyObject* _Py_strhex_with_sep(const char* argbuf, const Py_ssize_t arglen,
 | |
|                               PyObject* sep, const int bytes_per_group)
 | |
| {
 | |
|     return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 0);
 | |
| }
 | |
| 
 | |
| /* Same as above but returns a bytes() instead of str() to avoid the
 | |
|  * need to decode the str() when bytes are needed. */
 | |
| PyObject* _Py_strhex_bytes_with_sep(const char* argbuf, const Py_ssize_t arglen,
 | |
|                                     PyObject* sep, const int bytes_per_group)
 | |
| {
 | |
|     return _Py_strhex_impl(argbuf, arglen, sep, bytes_per_group, 1);
 | |
| }
 | 
