| /* stringlib: find/index implementation */ |
| |
| #ifndef STRINGLIB_FIND_H |
| #define STRINGLIB_FIND_H |
| |
| #ifndef STRINGLIB_FASTSEARCH_H |
| #error must include "stringlib/fastsearch.h" before including this module |
| #endif |
| |
| Py_LOCAL_INLINE(Py_ssize_t) |
| stringlib_find(const STRINGLIB_CHAR* str, Py_ssize_t str_len, |
| const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, |
| Py_ssize_t offset) |
| { |
| Py_ssize_t pos; |
| |
| if (str_len < 0) |
| return -1; |
| if (sub_len == 0) |
| return offset; |
| |
| pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_SEARCH); |
| |
| if (pos >= 0) |
| pos += offset; |
| |
| return pos; |
| } |
| |
| Py_LOCAL_INLINE(Py_ssize_t) |
| stringlib_rfind(const STRINGLIB_CHAR* str, Py_ssize_t str_len, |
| const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, |
| Py_ssize_t offset) |
| { |
| Py_ssize_t pos; |
| |
| if (str_len < 0) |
| return -1; |
| if (sub_len == 0) |
| return str_len + offset; |
| |
| pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_RSEARCH); |
| |
| if (pos >= 0) |
| pos += offset; |
| |
| return pos; |
| } |
| |
| /* helper macro to fixup start/end slice values */ |
| #define ADJUST_INDICES(start, end, len) \ |
| if (end > len) \ |
| end = len; \ |
| else if (end < 0) { \ |
| end += len; \ |
| if (end < 0) \ |
| end = 0; \ |
| } \ |
| if (start < 0) { \ |
| start += len; \ |
| if (start < 0) \ |
| start = 0; \ |
| } |
| |
| Py_LOCAL_INLINE(Py_ssize_t) |
| stringlib_find_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len, |
| const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, |
| Py_ssize_t start, Py_ssize_t end) |
| { |
| ADJUST_INDICES(start, end, str_len); |
| return stringlib_find(str + start, end - start, sub, sub_len, start); |
| } |
| |
| Py_LOCAL_INLINE(Py_ssize_t) |
| stringlib_rfind_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len, |
| const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, |
| Py_ssize_t start, Py_ssize_t end) |
| { |
| ADJUST_INDICES(start, end, str_len); |
| return stringlib_rfind(str + start, end - start, sub, sub_len, start); |
| } |
| |
| #ifdef STRINGLIB_WANT_CONTAINS_OBJ |
| |
| Py_LOCAL_INLINE(int) |
| stringlib_contains_obj(PyObject* str, PyObject* sub) |
| { |
| return stringlib_find( |
| STRINGLIB_STR(str), STRINGLIB_LEN(str), |
| STRINGLIB_STR(sub), STRINGLIB_LEN(sub), 0 |
| ) != -1; |
| } |
| |
| #endif /* STRINGLIB_WANT_CONTAINS_OBJ */ |
| |
| /* |
| This function is a helper for the "find" family (find, rfind, index, |
| rindex) and for count, startswith and endswith, because they all have |
| the same behaviour for the arguments. |
| |
| It does not touch the variables received until it knows everything |
| is ok. |
| */ |
| |
| #define FORMAT_BUFFER_SIZE 50 |
| |
| Py_LOCAL_INLINE(int) |
| stringlib_parse_args_finds(const char * function_name, PyObject *args, |
| PyObject **subobj, |
| Py_ssize_t *start, Py_ssize_t *end) |
| { |
| PyObject *tmp_subobj; |
| Py_ssize_t tmp_start = 0; |
| Py_ssize_t tmp_end = PY_SSIZE_T_MAX; |
| PyObject *obj_start=Py_None, *obj_end=Py_None; |
| char format[FORMAT_BUFFER_SIZE] = "O|OO:"; |
| size_t len = strlen(format); |
| |
| strncpy(format + len, function_name, FORMAT_BUFFER_SIZE - len - 1); |
| format[FORMAT_BUFFER_SIZE - 1] = '\0'; |
| |
| if (!PyArg_ParseTuple(args, format, &tmp_subobj, &obj_start, &obj_end)) |
| return 0; |
| |
| /* To support None in "start" and "end" arguments, meaning |
| the same as if they were not passed. |
| */ |
| if (obj_start != Py_None) |
| if (!_PyEval_SliceIndex(obj_start, &tmp_start)) |
| return 0; |
| if (obj_end != Py_None) |
| if (!_PyEval_SliceIndex(obj_end, &tmp_end)) |
| return 0; |
| |
| *start = tmp_start; |
| *end = tmp_end; |
| *subobj = tmp_subobj; |
| return 1; |
| } |
| |
| #undef FORMAT_BUFFER_SIZE |
| |
| #if STRINGLIB_IS_UNICODE |
| |
| /* |
| Wraps stringlib_parse_args_finds() and additionally ensures that the |
| first argument is a unicode object. |
| |
| Note that we receive a pointer to the pointer of the substring object, |
| so when we create that object in this function we don't DECREF it, |
| because it continues living in the caller functions (those functions, |
| after finishing using the substring, must DECREF it). |
| */ |
| |
| Py_LOCAL_INLINE(int) |
| stringlib_parse_args_finds_unicode(const char * function_name, PyObject *args, |
| PyUnicodeObject **substring, |
| Py_ssize_t *start, Py_ssize_t *end) |
| { |
| PyObject *tmp_substring; |
| |
| if(stringlib_parse_args_finds(function_name, args, &tmp_substring, |
| start, end)) { |
| tmp_substring = PyUnicode_FromObject(tmp_substring); |
| if (!tmp_substring) |
| return 0; |
| *substring = (PyUnicodeObject *)tmp_substring; |
| return 1; |
| } |
| return 0; |
| } |
| |
| #endif /* STRINGLIB_IS_UNICODE */ |
| |
| #endif /* STRINGLIB_FIND_H */ |