mirror of
				https://github.com/python/cpython.git
				synced 2025-11-04 03:44:55 +00:00 
			
		
		
		
	svn+ssh://pythondev@svn.python.org/python/branches/py3k ........ r75404 | antoine.pitrou | 2009-10-14 19:14:16 +0200 (mer., 14 oct. 2009) | 5 lines Issue #7065: Fix a crash in bytes.maketrans and bytearray.maketrans when using byte values greater than 127. Patch by egreen. ........
		
			
				
	
	
		
			464 lines
		
	
	
	
		
			9.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			464 lines
		
	
	
	
		
			9.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
#include "Python.h"
 | 
						|
#include "bytes_methods.h"
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_isspace__doc__,
 | 
						|
"B.isspace() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all characters in B are whitespace\n\
 | 
						|
and there is at least one character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_isspace(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1 && Py_ISSPACE(*p))
 | 
						|
        Py_RETURN_TRUE;
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
        Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (!Py_ISSPACE(*p))
 | 
						|
            Py_RETURN_FALSE;
 | 
						|
    }
 | 
						|
    Py_RETURN_TRUE;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_isalpha__doc__,
 | 
						|
"B.isalpha() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all characters in B are alphabetic\n\
 | 
						|
and there is at least one character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_isalpha(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1 && Py_ISALPHA(*p))
 | 
						|
	Py_RETURN_TRUE;
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (!Py_ISALPHA(*p))
 | 
						|
	    Py_RETURN_FALSE;
 | 
						|
    }
 | 
						|
    Py_RETURN_TRUE;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_isalnum__doc__,
 | 
						|
"B.isalnum() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all characters in B are alphanumeric\n\
 | 
						|
and there is at least one character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_isalnum(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1 && Py_ISALNUM(*p))
 | 
						|
	Py_RETURN_TRUE;
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (!Py_ISALNUM(*p))
 | 
						|
	    Py_RETURN_FALSE;
 | 
						|
    }
 | 
						|
    Py_RETURN_TRUE;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_isdigit__doc__,
 | 
						|
"B.isdigit() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all characters in B are digits\n\
 | 
						|
and there is at least one character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_isdigit(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1 && Py_ISDIGIT(*p))
 | 
						|
	Py_RETURN_TRUE;
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (!Py_ISDIGIT(*p))
 | 
						|
	    Py_RETURN_FALSE;
 | 
						|
    }
 | 
						|
    Py_RETURN_TRUE;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_islower__doc__,
 | 
						|
"B.islower() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all cased characters in B are lowercase and there is\n\
 | 
						|
at least one cased character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_islower(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
    int cased;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1)
 | 
						|
	return PyBool_FromLong(Py_ISLOWER(*p));
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    cased = 0;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (Py_ISUPPER(*p))
 | 
						|
	    Py_RETURN_FALSE;
 | 
						|
	else if (!cased && Py_ISLOWER(*p))
 | 
						|
	    cased = 1;
 | 
						|
    }
 | 
						|
    return PyBool_FromLong(cased);
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_isupper__doc__,
 | 
						|
"B.isupper() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if all cased characters in B are uppercase and there is\n\
 | 
						|
at least one cased character in B, False otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_isupper(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
    int cased;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1)
 | 
						|
	return PyBool_FromLong(Py_ISUPPER(*p));
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    cased = 0;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	if (Py_ISLOWER(*p))
 | 
						|
	    Py_RETURN_FALSE;
 | 
						|
	else if (!cased && Py_ISUPPER(*p))
 | 
						|
	    cased = 1;
 | 
						|
    }
 | 
						|
    return PyBool_FromLong(cased);
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_istitle__doc__,
 | 
						|
"B.istitle() -> bool\n\
 | 
						|
\n\
 | 
						|
Return True if B is a titlecased string and there is at least one\n\
 | 
						|
character in B, i.e. uppercase characters may only follow uncased\n\
 | 
						|
characters and lowercase characters only cased ones. Return False\n\
 | 
						|
otherwise.");
 | 
						|
 | 
						|
PyObject*
 | 
						|
_Py_bytes_istitle(const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
    register const unsigned char *p
 | 
						|
        = (unsigned char *) cptr;
 | 
						|
    register const unsigned char *e;
 | 
						|
    int cased, previous_is_cased;
 | 
						|
 | 
						|
    /* Shortcut for single character strings */
 | 
						|
    if (len == 1)
 | 
						|
	return PyBool_FromLong(Py_ISUPPER(*p));
 | 
						|
 | 
						|
    /* Special case for empty strings */
 | 
						|
    if (len == 0)
 | 
						|
	Py_RETURN_FALSE;
 | 
						|
 | 
						|
    e = p + len;
 | 
						|
    cased = 0;
 | 
						|
    previous_is_cased = 0;
 | 
						|
    for (; p < e; p++) {
 | 
						|
	register const unsigned char ch = *p;
 | 
						|
 | 
						|
	if (Py_ISUPPER(ch)) {
 | 
						|
	    if (previous_is_cased)
 | 
						|
		Py_RETURN_FALSE;
 | 
						|
	    previous_is_cased = 1;
 | 
						|
	    cased = 1;
 | 
						|
	}
 | 
						|
	else if (Py_ISLOWER(ch)) {
 | 
						|
	    if (!previous_is_cased)
 | 
						|
		Py_RETURN_FALSE;
 | 
						|
	    previous_is_cased = 1;
 | 
						|
	    cased = 1;
 | 
						|
	}
 | 
						|
	else
 | 
						|
	    previous_is_cased = 0;
 | 
						|
    }
 | 
						|
    return PyBool_FromLong(cased);
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_lower__doc__,
 | 
						|
"B.lower() -> copy of B\n\
 | 
						|
\n\
 | 
						|
Return a copy of B with all ASCII characters converted to lowercase.");
 | 
						|
 | 
						|
void
 | 
						|
_Py_bytes_lower(char *result, const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
	Py_ssize_t i;
 | 
						|
 | 
						|
        /*
 | 
						|
	newobj = PyBytes_FromStringAndSize(NULL, len);
 | 
						|
	if (!newobj)
 | 
						|
		return NULL;
 | 
						|
 | 
						|
	s = PyBytes_AS_STRING(newobj);
 | 
						|
        */
 | 
						|
 | 
						|
	Py_MEMCPY(result, cptr, len);
 | 
						|
 | 
						|
	for (i = 0; i < len; i++) {
 | 
						|
		int c = Py_CHARMASK(result[i]);
 | 
						|
		if (Py_ISUPPER(c))
 | 
						|
			result[i] = Py_TOLOWER(c);
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_upper__doc__,
 | 
						|
"B.upper() -> copy of B\n\
 | 
						|
\n\
 | 
						|
Return a copy of B with all ASCII characters converted to uppercase.");
 | 
						|
 | 
						|
void
 | 
						|
_Py_bytes_upper(char *result, const char *cptr, Py_ssize_t len)
 | 
						|
{
 | 
						|
	Py_ssize_t i;
 | 
						|
 | 
						|
        /*
 | 
						|
	newobj = PyBytes_FromStringAndSize(NULL, len);
 | 
						|
	if (!newobj)
 | 
						|
		return NULL;
 | 
						|
 | 
						|
	s = PyBytes_AS_STRING(newobj);
 | 
						|
        */
 | 
						|
 | 
						|
	Py_MEMCPY(result, cptr, len);
 | 
						|
 | 
						|
	for (i = 0; i < len; i++) {
 | 
						|
		int c = Py_CHARMASK(result[i]);
 | 
						|
		if (Py_ISLOWER(c))
 | 
						|
			result[i] = Py_TOUPPER(c);
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_title__doc__,
 | 
						|
"B.title() -> copy of B\n\
 | 
						|
\n\
 | 
						|
Return a titlecased version of B, i.e. ASCII words start with uppercase\n\
 | 
						|
characters, all remaining cased characters have lowercase.");
 | 
						|
 | 
						|
void
 | 
						|
_Py_bytes_title(char *result, char *s, Py_ssize_t len)
 | 
						|
{
 | 
						|
	Py_ssize_t i;
 | 
						|
	int previous_is_cased = 0;
 | 
						|
 | 
						|
        /*
 | 
						|
	newobj = PyBytes_FromStringAndSize(NULL, len);
 | 
						|
	if (newobj == NULL)
 | 
						|
		return NULL;
 | 
						|
	s_new = PyBytes_AsString(newobj);
 | 
						|
        */
 | 
						|
	for (i = 0; i < len; i++) {
 | 
						|
		int c = Py_CHARMASK(*s++);
 | 
						|
		if (Py_ISLOWER(c)) {
 | 
						|
			if (!previous_is_cased)
 | 
						|
			    c = Py_TOUPPER(c);
 | 
						|
			previous_is_cased = 1;
 | 
						|
		} else if (Py_ISUPPER(c)) {
 | 
						|
			if (previous_is_cased)
 | 
						|
			    c = Py_TOLOWER(c);
 | 
						|
			previous_is_cased = 1;
 | 
						|
		} else
 | 
						|
			previous_is_cased = 0;
 | 
						|
		*result++ = c;
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_capitalize__doc__,
 | 
						|
"B.capitalize() -> copy of B\n\
 | 
						|
\n\
 | 
						|
Return a copy of B with only its first character capitalized (ASCII).");
 | 
						|
 | 
						|
void
 | 
						|
_Py_bytes_capitalize(char *result, char *s, Py_ssize_t len)
 | 
						|
{
 | 
						|
	Py_ssize_t i;
 | 
						|
 | 
						|
        /*
 | 
						|
	newobj = PyBytes_FromStringAndSize(NULL, len);
 | 
						|
	if (newobj == NULL)
 | 
						|
		return NULL;
 | 
						|
	s_new = PyBytes_AsString(newobj);
 | 
						|
        */
 | 
						|
	if (0 < len) {
 | 
						|
		int c = Py_CHARMASK(*s++);
 | 
						|
		if (Py_ISLOWER(c))
 | 
						|
			*result = Py_TOUPPER(c);
 | 
						|
		else
 | 
						|
			*result = c;
 | 
						|
		result++;
 | 
						|
	}
 | 
						|
	for (i = 1; i < len; i++) {
 | 
						|
		int c = Py_CHARMASK(*s++);
 | 
						|
		if (Py_ISUPPER(c))
 | 
						|
			*result = Py_TOLOWER(c);
 | 
						|
		else
 | 
						|
			*result = c;
 | 
						|
		result++;
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_swapcase__doc__,
 | 
						|
"B.swapcase() -> copy of B\n\
 | 
						|
\n\
 | 
						|
Return a copy of B with uppercase ASCII characters converted\n\
 | 
						|
to lowercase ASCII and vice versa.");
 | 
						|
 | 
						|
void
 | 
						|
_Py_bytes_swapcase(char *result, char *s, Py_ssize_t len)
 | 
						|
{
 | 
						|
	Py_ssize_t i;
 | 
						|
 | 
						|
        /*
 | 
						|
	newobj = PyBytes_FromStringAndSize(NULL, len);
 | 
						|
	if (newobj == NULL)
 | 
						|
		return NULL;
 | 
						|
	s_new = PyBytes_AsString(newobj);
 | 
						|
        */
 | 
						|
	for (i = 0; i < len; i++) {
 | 
						|
		int c = Py_CHARMASK(*s++);
 | 
						|
		if (Py_ISLOWER(c)) {
 | 
						|
			*result = Py_TOUPPER(c);
 | 
						|
		}
 | 
						|
		else if (Py_ISUPPER(c)) {
 | 
						|
			*result = Py_TOLOWER(c);
 | 
						|
		}
 | 
						|
		else
 | 
						|
			*result = c;
 | 
						|
		result++;
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
PyDoc_STRVAR_shared(_Py_maketrans__doc__,
 | 
						|
"B.maketrans(frm, to) -> translation table\n\
 | 
						|
\n\
 | 
						|
Return a translation table (a bytes object of length 256)\n\
 | 
						|
suitable for use in bytes.translate where each byte in frm is\n\
 | 
						|
mapped to the byte at the same position in to.\n\
 | 
						|
The strings frm and to must be of the same length.");
 | 
						|
 | 
						|
static Py_ssize_t
 | 
						|
_getbuffer(PyObject *obj, Py_buffer *view)
 | 
						|
{
 | 
						|
    PyBufferProcs *buffer = Py_TYPE(obj)->tp_as_buffer;
 | 
						|
 | 
						|
    if (buffer == NULL || buffer->bf_getbuffer == NULL)
 | 
						|
    {
 | 
						|
        PyErr_Format(PyExc_TypeError,
 | 
						|
                     "Type %.100s doesn't support the buffer API",
 | 
						|
                     Py_TYPE(obj)->tp_name);
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
 | 
						|
    if (buffer->bf_getbuffer(obj, view, PyBUF_SIMPLE) < 0)
 | 
						|
            return -1;
 | 
						|
    return view->len;
 | 
						|
}
 | 
						|
 | 
						|
PyObject *
 | 
						|
_Py_bytes_maketrans(PyObject *args)
 | 
						|
{
 | 
						|
	PyObject *frm, *to, *res = NULL;
 | 
						|
	Py_buffer bfrm, bto;
 | 
						|
	Py_ssize_t i;
 | 
						|
	char *p;
 | 
						|
 | 
						|
	bfrm.len = -1;
 | 
						|
	bto.len = -1;
 | 
						|
	
 | 
						|
	if (!PyArg_ParseTuple(args, "OO:maketrans", &frm, &to))
 | 
						|
		return NULL;
 | 
						|
	if (_getbuffer(frm, &bfrm) < 0)
 | 
						|
		return NULL;
 | 
						|
	if (_getbuffer(to, &bto) < 0)
 | 
						|
		goto done;
 | 
						|
	if (bfrm.len != bto.len) {
 | 
						|
		PyErr_Format(PyExc_ValueError,
 | 
						|
			     "maketrans arguments must have same length");
 | 
						|
		goto done;
 | 
						|
	}
 | 
						|
	res = PyBytes_FromStringAndSize(NULL, 256);
 | 
						|
	if (!res) {
 | 
						|
		goto done;
 | 
						|
	}
 | 
						|
	p = PyBytes_AS_STRING(res);
 | 
						|
	for (i = 0; i < 256; i++)
 | 
						|
		p[i] = i;
 | 
						|
	for (i = 0; i < bfrm.len; i++) {
 | 
						|
		p[((unsigned char *)bfrm.buf)[i]] = ((char *)bto.buf)[i];
 | 
						|
	}
 | 
						|
 | 
						|
  done:
 | 
						|
	if (bfrm.len != -1)
 | 
						|
		PyBuffer_Release(&bfrm);
 | 
						|
	if (bto.len != -1)
 | 
						|
		PyBuffer_Release(&bto);
 | 
						|
	return res;
 | 
						|
}
 |