/* stringlib: find/index implementation */ | |
#ifndef STRINGLIB_FIND_H | |
#define STRINGLIB_FIND_H | |
#ifndef STRINGLIB_FASTSEARCH_H | |
#error must include "stringlib/fastsearch.h" before including this module | |
#endif | |
Py_LOCAL_INLINE(Py_ssize_t) | |
stringlib_find(const STRINGLIB_CHAR* str, Py_ssize_t str_len, | |
const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, | |
Py_ssize_t offset) | |
{ | |
Py_ssize_t pos; | |
if (str_len < 0) | |
return -1; | |
if (sub_len == 0) | |
return offset; | |
pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_SEARCH); | |
if (pos >= 0) | |
pos += offset; | |
return pos; | |
} | |
Py_LOCAL_INLINE(Py_ssize_t) | |
stringlib_rfind(const STRINGLIB_CHAR* str, Py_ssize_t str_len, | |
const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, | |
Py_ssize_t offset) | |
{ | |
Py_ssize_t pos; | |
if (str_len < 0) | |
return -1; | |
if (sub_len == 0) | |
return str_len + offset; | |
pos = fastsearch(str, str_len, sub, sub_len, -1, FAST_RSEARCH); | |
if (pos >= 0) | |
pos += offset; | |
return pos; | |
} | |
/* helper macro to fixup start/end slice values */ | |
#define ADJUST_INDICES(start, end, len) \ | |
if (end > len) \ | |
end = len; \ | |
else if (end < 0) { \ | |
end += len; \ | |
if (end < 0) \ | |
end = 0; \ | |
} \ | |
if (start < 0) { \ | |
start += len; \ | |
if (start < 0) \ | |
start = 0; \ | |
} | |
Py_LOCAL_INLINE(Py_ssize_t) | |
stringlib_find_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len, | |
const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, | |
Py_ssize_t start, Py_ssize_t end) | |
{ | |
ADJUST_INDICES(start, end, str_len); | |
return stringlib_find(str + start, end - start, sub, sub_len, start); | |
} | |
Py_LOCAL_INLINE(Py_ssize_t) | |
stringlib_rfind_slice(const STRINGLIB_CHAR* str, Py_ssize_t str_len, | |
const STRINGLIB_CHAR* sub, Py_ssize_t sub_len, | |
Py_ssize_t start, Py_ssize_t end) | |
{ | |
ADJUST_INDICES(start, end, str_len); | |
return stringlib_rfind(str + start, end - start, sub, sub_len, start); | |
} | |
#ifdef STRINGLIB_WANT_CONTAINS_OBJ | |
Py_LOCAL_INLINE(int) | |
stringlib_contains_obj(PyObject* str, PyObject* sub) | |
{ | |
return stringlib_find( | |
STRINGLIB_STR(str), STRINGLIB_LEN(str), | |
STRINGLIB_STR(sub), STRINGLIB_LEN(sub), 0 | |
) != -1; | |
} | |
#endif /* STRINGLIB_WANT_CONTAINS_OBJ */ | |
/* | |
This function is a helper for the "find" family (find, rfind, index, | |
rindex) and for count, startswith and endswith, because they all have | |
the same behaviour for the arguments. | |
It does not touch the variables received until it knows everything | |
is ok. | |
*/ | |
#define FORMAT_BUFFER_SIZE 50 | |
Py_LOCAL_INLINE(int) | |
stringlib_parse_args_finds(const char * function_name, PyObject *args, | |
PyObject **subobj, | |
Py_ssize_t *start, Py_ssize_t *end) | |
{ | |
PyObject *tmp_subobj; | |
Py_ssize_t tmp_start = 0; | |
Py_ssize_t tmp_end = PY_SSIZE_T_MAX; | |
PyObject *obj_start=Py_None, *obj_end=Py_None; | |
char format[FORMAT_BUFFER_SIZE] = "O|OO:"; | |
size_t len = strlen(format); | |
strncpy(format + len, function_name, FORMAT_BUFFER_SIZE - len - 1); | |
format[FORMAT_BUFFER_SIZE - 1] = '\0'; | |
if (!PyArg_ParseTuple(args, format, &tmp_subobj, &obj_start, &obj_end)) | |
return 0; | |
/* To support None in "start" and "end" arguments, meaning | |
the same as if they were not passed. | |
*/ | |
if (obj_start != Py_None) | |
if (!_PyEval_SliceIndex(obj_start, &tmp_start)) | |
return 0; | |
if (obj_end != Py_None) | |
if (!_PyEval_SliceIndex(obj_end, &tmp_end)) | |
return 0; | |
*start = tmp_start; | |
*end = tmp_end; | |
*subobj = tmp_subobj; | |
return 1; | |
} | |
#undef FORMAT_BUFFER_SIZE | |
#if STRINGLIB_IS_UNICODE | |
/* | |
Wraps stringlib_parse_args_finds() and additionally ensures that the | |
first argument is a unicode object. | |
Note that we receive a pointer to the pointer of the substring object, | |
so when we create that object in this function we don't DECREF it, | |
because it continues living in the caller functions (those functions, | |
after finishing using the substring, must DECREF it). | |
*/ | |
Py_LOCAL_INLINE(int) | |
stringlib_parse_args_finds_unicode(const char * function_name, PyObject *args, | |
PyUnicodeObject **substring, | |
Py_ssize_t *start, Py_ssize_t *end) | |
{ | |
PyObject *tmp_substring; | |
if(stringlib_parse_args_finds(function_name, args, &tmp_substring, | |
start, end)) { | |
tmp_substring = PyUnicode_FromObject(tmp_substring); | |
if (!tmp_substring) | |
return 0; | |
*substring = (PyUnicodeObject *)tmp_substring; | |
return 1; | |
} | |
return 0; | |
} | |
#endif /* STRINGLIB_IS_UNICODE */ | |
#endif /* STRINGLIB_FIND_H */ |