mirror of
https://github.com/python/cpython.git
synced 2025-08-03 08:34:29 +00:00
Added checks to prevent PyUnicode_Count() from dumping core
in case the parameters are out of bounds and fixes error handling for .count(), .startswith() and .endswith() for the case of mixed string/Unicode objects. This patch adds Python style index semantics to PyUnicode_Count() indices (including the special handling of negative indices). The patch is an extended version of patch #103249 submitted by Michael Hudson (mwh) on SF. It also includes new test cases.
This commit is contained in:
parent
1c5aa6901f
commit
3a645e4dd4
4 changed files with 56 additions and 19 deletions
|
@ -1236,9 +1236,14 @@ string_count(PyStringObject *self, PyObject *args)
|
|||
sub = PyString_AS_STRING(subobj);
|
||||
n = PyString_GET_SIZE(subobj);
|
||||
}
|
||||
else if (PyUnicode_Check(subobj))
|
||||
return PyInt_FromLong(
|
||||
PyUnicode_Count((PyObject *)self, subobj, i, last));
|
||||
else if (PyUnicode_Check(subobj)) {
|
||||
int count;
|
||||
count = PyUnicode_Count((PyObject *)self, subobj, i, last);
|
||||
if (count == -1)
|
||||
return NULL;
|
||||
else
|
||||
return PyInt_FromLong((long) count);
|
||||
}
|
||||
else if (PyObject_AsCharBuffer(subobj, &sub, &n))
|
||||
return NULL;
|
||||
|
||||
|
@ -1637,10 +1642,15 @@ string_startswith(PyStringObject *self, PyObject *args)
|
|||
prefix = PyString_AS_STRING(subobj);
|
||||
plen = PyString_GET_SIZE(subobj);
|
||||
}
|
||||
else if (PyUnicode_Check(subobj))
|
||||
return PyInt_FromLong(
|
||||
PyUnicode_Tailmatch((PyObject *)self,
|
||||
subobj, start, end, -1));
|
||||
else if (PyUnicode_Check(subobj)) {
|
||||
int rc;
|
||||
rc = PyUnicode_Tailmatch((PyObject *)self,
|
||||
subobj, start, end, -1);
|
||||
if (rc == -1)
|
||||
return NULL;
|
||||
else
|
||||
return PyInt_FromLong((long) rc);
|
||||
}
|
||||
else if (PyObject_AsCharBuffer(subobj, &prefix, &plen))
|
||||
return NULL;
|
||||
|
||||
|
@ -1690,10 +1700,15 @@ string_endswith(PyStringObject *self, PyObject *args)
|
|||
suffix = PyString_AS_STRING(subobj);
|
||||
slen = PyString_GET_SIZE(subobj);
|
||||
}
|
||||
else if (PyUnicode_Check(subobj))
|
||||
return PyInt_FromLong(
|
||||
PyUnicode_Tailmatch((PyObject *)self,
|
||||
subobj, start, end, +1));
|
||||
else if (PyUnicode_Check(subobj)) {
|
||||
int rc;
|
||||
rc = PyUnicode_Tailmatch((PyObject *)self,
|
||||
subobj, start, end, +1);
|
||||
if (rc == -1)
|
||||
return NULL;
|
||||
else
|
||||
return PyInt_FromLong((long) rc);
|
||||
}
|
||||
else if (PyObject_AsCharBuffer(subobj, &suffix, &slen))
|
||||
return NULL;
|
||||
|
||||
|
|
|
@ -1976,7 +1976,7 @@ PyObject *PyUnicode_DecodeCharmap(const char *s,
|
|||
x = Py_None;
|
||||
Py_INCREF(x);
|
||||
} else
|
||||
goto onError;
|
||||
goto onError;
|
||||
}
|
||||
|
||||
/* Apply mapping */
|
||||
|
@ -2014,9 +2014,9 @@ PyObject *PyUnicode_DecodeCharmap(const char *s,
|
|||
(targetsize << 2);
|
||||
extrachars += needed;
|
||||
if (_PyUnicode_Resize(v, PyUnicode_GET_SIZE(v) + needed)) {
|
||||
Py_DECREF(x);
|
||||
goto onError;
|
||||
}
|
||||
Py_DECREF(x);
|
||||
goto onError;
|
||||
}
|
||||
p = PyUnicode_AS_UNICODE(v) + oldpos;
|
||||
}
|
||||
Py_UNICODE_COPY(p,
|
||||
|
@ -2112,7 +2112,7 @@ PyObject *PyUnicode_EncodeCharmap(const Py_UNICODE *p,
|
|||
x = Py_None;
|
||||
Py_INCREF(x);
|
||||
} else
|
||||
goto onError;
|
||||
goto onError;
|
||||
}
|
||||
|
||||
/* Apply mapping */
|
||||
|
@ -2150,9 +2150,9 @@ PyObject *PyUnicode_EncodeCharmap(const Py_UNICODE *p,
|
|||
(targetsize << 2);
|
||||
extrachars += needed;
|
||||
if (_PyString_Resize(&v, PyString_GET_SIZE(v) + needed)) {
|
||||
Py_DECREF(x);
|
||||
goto onError;
|
||||
}
|
||||
Py_DECREF(x);
|
||||
goto onError;
|
||||
}
|
||||
s = PyString_AS_STRING(v) + oldpos;
|
||||
}
|
||||
memcpy(s,
|
||||
|
@ -2392,6 +2392,17 @@ int count(PyUnicodeObject *self,
|
|||
{
|
||||
int count = 0;
|
||||
|
||||
if (start < 0)
|
||||
start += self->length;
|
||||
if (start < 0)
|
||||
start = 0;
|
||||
if (end > self->length)
|
||||
end = self->length;
|
||||
if (end < 0)
|
||||
end += self->length;
|
||||
if (end < 0)
|
||||
end = 0;
|
||||
|
||||
if (substring->length == 0)
|
||||
return (end - start + 1);
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue