mirror of
				https://github.com/python/cpython.git
				synced 2025-10-24 23:46:23 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			175 lines
		
	
	
	
		
			5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			175 lines
		
	
	
	
		
			5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* stringlib: find/index implementation */
 | |
| 
 | |
| #ifndef STRINGLIB_FIND_H
 | |
| #define STRINGLIB_FIND_H
 | |
| 
 | |
| #ifndef STRINGLIB_FASTSEARCH_H
 | |
| #error must include "stringlib/fastsearch.h" before including this module
 | |
| #endif
 | |
| 
 | |
| Py_LOCAL_INLINE(Py_ssize_t)
 | |
| stringlib_find(const STRINGLIB_CHAR* str, Py_ssize_t str_len,
 | |
|                const STRINGLIB_CHAR* sub, Py_ssize_t sub_len,
 | |
|                Py_ssize_t offset)
 | |
| {
 | |
|     Py_ssize_t pos;
 | |
| 
 | |
|     if (str_len < 0)
 | |
|         return -1;
 | |
|     if (sub_len == 0)
 | |
|         return offset;
 | |
| 
 | |
|     pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_SEARCH);
 | |
| 
 | |
|     if (pos >= 0)
 | |
|         pos += offset;
 | |
| 
 | |
|     return pos;
 | |
| }
 | |
| 
 | |
| Py_LOCAL_INLINE(Py_ssize_t)
 | |
| stringlib_rfind(const STRINGLIB_CHAR* str, Py_ssize_t str_len,
 | |
|                 const STRINGLIB_CHAR* sub, Py_ssize_t sub_len,
 | |
|                 Py_ssize_t offset)
 | |
| {
 | |
|     Py_ssize_t pos;
 | |
| 
 | |
|     if (str_len < 0)
 | |
|         return -1;
 | |
|     if (sub_len == 0)
 | |
|         return str_len + offset;
 | |
| 
 | |
|     pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_RSEARCH);
 | |
| 
 | |
|     if (pos >= 0)
 | |
|         pos += offset;
 | |
| 
 | |
|     return pos;
 | |
| }
 | |
| 
 | |
| /* helper macro to fixup start/end slice values */
 | |
| #define ADJUST_INDICES(start, end, len)         \
 | |
|     if (end > len)                              \
 | |
|         end = len;                              \
 | |
|     else if (end < 0) {                         \
 | |
|         end += len;                             \
 | |
|         if (end < 0)                            \
 | |
|             end = 0;                            \
 | |
|     }                                           \
 | |
|     if (start < 0) {                            \
 | |
|         start += len;                           \
 | |
|         if (start < 0)                          \
 | |
|             start = 0;                          \
 | |
|     }
 | |
| 
 | |
| Py_LOCAL_INLINE(Py_ssize_t)
 | |
| stringlib_find_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len,
 | |
|                      const STRINGLIB_CHAR* sub, Py_ssize_t sub_len,
 | |
|                      Py_ssize_t start, Py_ssize_t end)
 | |
| {
 | |
|     ADJUST_INDICES(start, end, str_len);
 | |
|     return stringlib_find(str + start, end - start, sub, sub_len, start);
 | |
| }
 | |
| 
 | |
| Py_LOCAL_INLINE(Py_ssize_t)
 | |
| stringlib_rfind_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len,
 | |
|                       const STRINGLIB_CHAR* sub, Py_ssize_t sub_len,
 | |
|                       Py_ssize_t start, Py_ssize_t end)
 | |
| {
 | |
|     ADJUST_INDICES(start, end, str_len);
 | |
|     return stringlib_rfind(str + start, end - start, sub, sub_len, start);
 | |
| }
 | |
| 
 | |
| #ifdef STRINGLIB_WANT_CONTAINS_OBJ
 | |
| 
 | |
| Py_LOCAL_INLINE(int)
 | |
| stringlib_contains_obj(PyObject* str, PyObject* sub)
 | |
| {
 | |
|     return stringlib_find(
 | |
|         STRINGLIB_STR(str), STRINGLIB_LEN(str),
 | |
|         STRINGLIB_STR(sub), STRINGLIB_LEN(sub), 0
 | |
|         ) != -1;
 | |
| }
 | |
| 
 | |
| #endif /* STRINGLIB_WANT_CONTAINS_OBJ */
 | |
| 
 | |
| /*
 | |
| This function is a helper for the "find" family (find, rfind, index,
 | |
| rindex) and for count, startswith and endswith, because they all have
 | |
| the same behaviour for the arguments.
 | |
| 
 | |
| It does not touch the variables received until it knows everything 
 | |
| is ok.
 | |
| */
 | |
| 
 | |
| #define FORMAT_BUFFER_SIZE 50
 | |
| 
 | |
| Py_LOCAL_INLINE(int)
 | |
| stringlib_parse_args_finds(const char * function_name, PyObject *args,
 | |
|                            PyObject **subobj,
 | |
|                            Py_ssize_t *start, Py_ssize_t *end)
 | |
| {
 | |
|     PyObject *tmp_subobj;
 | |
|     Py_ssize_t tmp_start = 0;
 | |
|     Py_ssize_t tmp_end = PY_SSIZE_T_MAX;
 | |
|     PyObject *obj_start=Py_None, *obj_end=Py_None;
 | |
|     char format[FORMAT_BUFFER_SIZE] = "O|OO:";
 | |
|     size_t len = strlen(format);
 | |
| 
 | |
|     strncpy(format + len, function_name, FORMAT_BUFFER_SIZE - len - 1);
 | |
|     format[FORMAT_BUFFER_SIZE - 1] = '\0';
 | |
| 
 | |
|     if (!PyArg_ParseTuple(args, format, &tmp_subobj, &obj_start, &obj_end))
 | |
|         return 0;
 | |
| 
 | |
|     /* To support None in "start" and "end" arguments, meaning
 | |
|        the same as if they were not passed.
 | |
|     */
 | |
|     if (obj_start != Py_None)
 | |
|         if (!_PyEval_SliceIndex(obj_start, &tmp_start))
 | |
|             return 0;
 | |
|     if (obj_end != Py_None)
 | |
|         if (!_PyEval_SliceIndex(obj_end, &tmp_end))
 | |
|             return 0;
 | |
| 
 | |
|     *start = tmp_start;
 | |
|     *end = tmp_end;
 | |
|     *subobj = tmp_subobj;
 | |
|     return 1;
 | |
| }
 | |
| 
 | |
| #undef FORMAT_BUFFER_SIZE
 | |
| 
 | |
| #if STRINGLIB_IS_UNICODE
 | |
| 
 | |
| /*
 | |
| Wraps stringlib_parse_args_finds() and additionally ensures that the
 | |
| first argument is a unicode object.
 | |
| 
 | |
| Note that we receive a pointer to the pointer of the substring object,
 | |
| so when we create that object in this function we don't DECREF it,
 | |
| because it continues living in the caller functions (those functions, 
 | |
| after finishing using the substring, must DECREF it).
 | |
| */
 | |
| 
 | |
| Py_LOCAL_INLINE(int)
 | |
| stringlib_parse_args_finds_unicode(const char * function_name, PyObject *args,
 | |
|                                    PyUnicodeObject **substring,
 | |
|                                    Py_ssize_t *start, Py_ssize_t *end)
 | |
| {
 | |
|     PyObject *tmp_substring;
 | |
| 
 | |
|     if(stringlib_parse_args_finds(function_name, args, &tmp_substring,
 | |
|                                   start, end)) {
 | |
|         tmp_substring = PyUnicode_FromObject(tmp_substring);
 | |
|         if (!tmp_substring)
 | |
|             return 0;
 | |
|         *substring = (PyUnicodeObject *)tmp_substring;
 | |
|         return 1;
 | |
|     }
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| #endif /* STRINGLIB_IS_UNICODE */
 | |
| 
 | |
| #endif /* STRINGLIB_FIND_H */
 | 
