1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145
|
% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/search.R
\name{about_search}
\alias{about_search}
\alias{search}
\alias{stringi-search}
\title{String Searching}
\description{
This man page explains how to perform string search-based
operations in \pkg{stringi}.
}
\details{
The following independent string searching engines are available
in \pkg{stringi}.
\itemize{
\item \code{stri_*_regex} -- \pkg{ICU}'s regular expressions (regexes),
see \link{about_search_regex},
\item \code{stri_*_fixed} -- locale-independent byte-wise pattern matching,
see \link{about_search_fixed},
\item \code{stri_*_coll} -- \pkg{ICU}'s \code{StringSearch},
locale-sensitive, Collator-based pattern search,
useful for natural language processing tasks,
see \link{about_search_coll},
\item \code{stri_*_charclass} -- character classes search,
e.g., Unicode General Categories or Binary Properties,
see \link{about_search_charclass},
\item \code{stri_*_boundaries} -- text boundary analysis,
see \link{about_search_boundaries}.
}
Each search engine is able to perform many search-based operations.
These may include:
\itemize{
\item \code{stri_detect_*} -- detect if a pattern occurs in a string,
see, e.g., \code{\link{stri_detect}},
\item \code{stri_count_*} -- count the number of pattern occurrences,
see, e.g., \code{\link{stri_count}},
\item \code{stri_locate_*} -- locate all, first, or last occurrences
of a pattern, see, e.g., \code{\link{stri_locate}},
\item \code{stri_extract_*} -- extract all, first, or last occurrences
of a pattern, see, e.g., \code{\link{stri_extract}}
and, in case of regexes, \code{\link{stri_match}},
\item \code{stri_replace_*} -- replace all, first, or last occurrences
of a pattern, see, e.g., \code{\link{stri_replace}}
and also \code{\link{stri_trim}},
\item \code{stri_split_*} -- split a string into chunks indicated
by occurrences of a pattern,
see, e.g., \code{\link{stri_split}},
\item \code{stri_startswith_*} and \code{stri_endswith_*} -- detect
if a string starts or ends with a pattern match, see,
e.g., \code{\link{stri_startswith}},
\item \code{stri_subset_*} -- return a subset of a character vector
with strings that match a given pattern, see, e.g., \code{\link{stri_subset}}.
}
}
\seealso{
The official online manual of \pkg{stringi} at \url{https://stringi.gagolewski.com/}
Gagolewski M., \pkg{stringi}: Fast and portable character string processing in R, \emph{Journal of Statistical Software} 103(2), 2022, 1--59, \doi{10.18637/jss.v103.i02}
Other text_boundaries:
\code{\link{about_search_boundaries}},
\code{\link{stri_count_boundaries}()},
\code{\link{stri_extract_all_boundaries}()},
\code{\link{stri_locate_all_boundaries}()},
\code{\link{stri_opts_brkiter}()},
\code{\link{stri_split_boundaries}()},
\code{\link{stri_split_lines}()},
\code{\link{stri_trans_tolower}()},
\code{\link{stri_wrap}()}
Other search_regex:
\code{\link{about_search_regex}},
\code{\link{stri_opts_regex}()}
Other search_fixed:
\code{\link{about_search_fixed}},
\code{\link{stri_opts_fixed}()}
Other search_coll:
\code{\link{about_search_coll}},
\code{\link{stri_opts_collator}()}
Other search_charclass:
\code{\link{about_search_charclass}},
\code{\link{stri_trim_both}()}
Other search_detect:
\code{\link{stri_detect}()},
\code{\link{stri_startswith}()}
Other search_count:
\code{\link{stri_count_boundaries}()},
\code{\link{stri_count}()}
Other search_locate:
\code{\link{stri_locate_all_boundaries}()},
\code{\link{stri_locate_all}()}
Other search_replace:
\code{\link{stri_replace_all}()},
\code{\link{stri_replace_rstr}()},
\code{\link{stri_trim_both}()}
Other search_split:
\code{\link{stri_split_boundaries}()},
\code{\link{stri_split_lines}()},
\code{\link{stri_split}()}
Other search_subset:
\code{\link{stri_subset}()}
Other search_extract:
\code{\link{stri_extract_all_boundaries}()},
\code{\link{stri_extract_all}()},
\code{\link{stri_match_all}()}
Other stringi_general_topics:
\code{\link{about_arguments}},
\code{\link{about_encoding}},
\code{\link{about_locale}},
\code{\link{about_search_boundaries}},
\code{\link{about_search_charclass}},
\code{\link{about_search_coll}},
\code{\link{about_search_fixed}},
\code{\link{about_search_regex}},
\code{\link{about_stringi}}
}
\concept{search_charclass}
\concept{search_coll}
\concept{search_count}
\concept{search_detect}
\concept{search_extract}
\concept{search_fixed}
\concept{search_in}
\concept{search_locate}
\concept{search_regex}
\concept{search_replace}
\concept{search_split}
\concept{search_subset}
\concept{stringi_general_topics}
\concept{text_boundaries}
\author{
\href{https://www.gagolewski.com/}{Marek Gagolewski} and other contributors
}
|