diff --git a/DESCRIPTION b/DESCRIPTION index dae77c851..6461c055d 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,6 +1,6 @@ Package: stringi Version: 1.6.1 -Date: 2021-04-29 +Date: 2021-04-30 Title: Character String Processing Facilities Description: A multitude of character string/text/natural language processing tools: pattern searching (e.g., with 'Java'-like regular diff --git a/NAMESPACE b/NAMESPACE index e45c04f32..1a3029981 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -172,6 +172,7 @@ export(stri_paste_list) export(stri_rand_lipsum) export(stri_rand_shuffle) export(stri_rand_strings) +export(stri_rank) export(stri_read_lines) export(stri_read_raw) export(stri_remove_empty) diff --git a/NEWS b/NEWS index 194498f6b..4654ec6a4 100644 --- a/NEWS +++ b/NEWS @@ -18,14 +18,19 @@ The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39. -* ...todo... #408 (stri_trans_casefold), +* [NEW FEATURE] #408: ...todo... `stri_trans_casefold()`, -* [INTERNAL] #414: Use `LEVELS(x)` macro instead of accessing `(x)->sxpinfo.gp` - directly (@lukaszdaniel). +* [NEW FEATURE] #421: `stri_rank()` ranks strings in a character vector + (e.g., for ordering data frames with regards to multiple criteria, + the ranks can be passed to `order()`, see #219). + +* [BUGFIX] `stri_sort_key()` now outputs `bytes`-encoded strings. * [BUGFIX] #415: `locale=''` was not equivalent to `locale=NULL` in `stri_opts_collator()`. +* [INTERNAL] #414: Use `LEVELS(x)` macro instead of accessing `(x)->sxpinfo.gp` + directly (@lukaszdaniel). ## 1.5.3 (2020-09-04) **CRAN** diff --git a/R/encoding.R b/R/encoding.R index 4b8db22ab..e36805d57 100644 --- a/R/encoding.R +++ b/R/encoding.R @@ -133,7 +133,7 @@ #' is a translation scheme: we need to communicate with \R somehow, #' relying on how it represents strings. #' -#' Basically, \R has a very simple encoding marking mechanism, +#' Overall, \R has a very simple encoding marking mechanism, #' see \code{\link{stri_enc_mark}}. 
There is an implicit assumption #' that your platform's default (native) encoding always extends #' ASCII -- \pkg{stringi} checks that whenever your native encoding diff --git a/R/sort.R b/R/sort.R index 8672d8e0b..7d20c2cb7 100644 --- a/R/sort.R +++ b/R/sort.R @@ -36,7 +36,7 @@ #' #' #' @description -#' This function sorts a character vector according to the locale-dependent +#' This function sorts a character vector according to a locale-dependent #' lexicographic order. #' #' @@ -45,7 +45,7 @@ #' in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. #' #' As usual in \pkg{stringi}, non-character inputs are coerced to strings, -#' see an example below for a perhaps non-intitive behavior of lexicographic +#' see an example below for a somewhat non-intuitive behavior of lexicographic #' sorting on numeric inputs. #' #' This function uses a stable sort algorithm (\pkg{STL}'s \code{stable_sort}), @@ -106,16 +106,16 @@ stri_sort <- function(str, decreasing = FALSE, na_last = NA, ..., opts_collator #' in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. #' #' As usual in \pkg{stringi}, non-character inputs are coerced to strings, -#' see an example below for a perhaps non-intuitive behavior of lexicographic +#' see an example below for a somewhat non-intuitive behavior of lexicographic #' sorting on numeric inputs. #' -#' -#' -#' #' This function uses a stable sort algorithm (\pkg{STL}'s \code{stable_sort}), #' which performs up to \eqn{N*log^2(N)} element comparisons, #' where \eqn{N} is the length of \code{str}. #' +#' For ordering with regards to multiple criteria (such as sorting +#' data frames by more than 1 column), see \code{\link{stri_rank}}. +#' #' @param str a character vector #' @param decreasing a single logical value; should the sort order #' be nondecreasing (\code{FALSE}, default) @@ -288,16 +288,20 @@ stri_duplicated_any <- function(str, from_last = FALSE, fromLast = from_last, .. 
#' Sort Keys #' #' @description -#' This function computes a locale-dependent 'sort key', which is an alternative +#' This function computes a locale-dependent sort key, which is an alternative #' character representation of the string that, when ordered in the C locale -#' (which orders using bytes directly), will give an equivalent ordering to the -#' original string. It is useful for enhancing algorithms that sort only in the -#' C locale with the ability to be locale-aware. +#' (which orders using the underlying bytes directly), will give an equivalent +#' ordering to the original string. It is useful for enhancing algorithms +#' that sort only in the C locale (e.g., the \code{strcmp} function in libc) +#' with the ability to be locale-aware. #' #' @details #' For more information on \pkg{ICU}'s Collator and how to tune it up #' in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. #' +#' See also \code{\link{stri_rank}} for ranking strings with a single character +#' vector, i.e., generating relative sort keys. +#' #' @param str a character vector #' @param opts_collator a named list with \pkg{ICU} Collator's options, #' see \code{\link{stri_opts_collator}}, \code{NULL} @@ -306,7 +310,7 @@ stri_duplicated_any <- function(str, from_last = FALSE, fromLast = from_last, .. #' #' @return #' The result is a character vector with the same length as \code{str} that -#' contains the sort keys. +#' contains the sort keys. The output is marked as \code{bytes}-encoded. #' #' @references #' \emph{Collation} - ICU User Guide, @@ -325,3 +329,58 @@ stri_sort_key <- function(str, ..., opts_collator = NULL) opts_collator <- do.call(stri_opts_collator, as.list(c(opts_collator, ...))) .Call(C_stri_sort_key, str, opts_collator) } + + + +#' @title +#' Ranking +#' +#' +#' @description +#' This function ranks each string in a character vector according to a +#' locale-dependent lexicographic order. +#' It is a portable replacement for the base \code{xtfrm} function. 
+#' +#' +#' @details +#' Missing values result in missing ranks and tied observations receive +#' the same ranks (based on min). +#' +#' For more information on \pkg{ICU}'s Collator and how to tune it up +#' in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. +#' +#' @param str a character vector +#' @param opts_collator a named list with \pkg{ICU} Collator's options, +#' see \code{\link{stri_opts_collator}}, \code{NULL} +#' for default collation options +#' @param ... additional settings for \code{opts_collator} +#' +#' @return +#' The result is a vector of ranks corresponding to each +#' string in \code{str}. +#' +#' @references +#' \emph{Collation} - ICU User Guide, +#' \url{http://userguide.icu-project.org/collation} +#' +#' @family locale_sensitive +#' @export +#' @rdname stri_rank +#' +#' @examples +#' stri_rank(c('hladny', 'chladny'), locale='pl_PL') +#' stri_rank(c('hladny', 'chladny'), locale='sk_SK') +#' +#' stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10)) # lexicographic order +#' stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE) +#' +#' # Ordering a data frame with respect to two criteria: +#' X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8)) +#' X[order(stri_rank(X$a), X$b), ] +stri_rank <- function(str, ..., opts_collator=NULL) +{ + if (!missing(...)) + opts_collator <- do.call(stri_opts_collator, as.list(c(opts_collator, ...))) + + .Call(C_stri_rank, str, opts_collator) +} diff --git a/R/stringi-package.R b/R/stringi-package.R index b1f58fbef..b277ca536 100644 --- a/R/stringi-package.R +++ b/R/stringi-package.R @@ -37,7 +37,7 @@ #' \pkg{stringi} is THE R package for fast, correct, consistent, #' and convenient string/text manipulation. #' It gives predictable results on every platform, in each locale, -#' and under any ``native'' character encoding. +#' and under any native character encoding. 
#' #' \bold{Keywords}: R, text processing, character strings, #' internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode. @@ -61,7 +61,7 @@ #' locale-sensitive operations. In particular, see #' \code{\link{stri_opts_collator}} for a description of the string #' collation algorithm, which is used for string comparing, ordering, -#' sorting, case-folding, and searching. +#' ranking, sorting, case-folding, and searching. #' #' \item \link{about_arguments} -- information on how \pkg{stringi} #' treats its functions' arguments. @@ -119,8 +119,8 @@ #' text transforms, including transliteration. #' #' \item \code{\link{stri_cmp}}, \code{\link{\%s<\%}}, \code{\link{stri_order}}, -#' \code{\link{stri_sort}}, \code{\link{stri_unique}}, and -#' \code{\link{stri_duplicated}} for collation-based, +#' \code{\link{stri_sort}}, \code{\link{stri_rank}}, \code{\link{stri_unique}}, +#' and \code{\link{stri_duplicated}} for collation-based, #' locale-aware operations, see also \link{about_locale}. #' #' \item \code{\link{stri_split_lines}} (among others) @@ -147,9 +147,8 @@ #' @docType package #' @author Marek Gagolewski, #' with contributions from Bartek Tartanus and many others. -#' ICU4C was developed by IBM and others. -#' The Unicode Character Database is due to Unicode, Inc.; -#' see the COPYRIGHTS file for more details. +#' ICU4C was developed by IBM, Unicode, Inc., and others. 
+#' #' @references #' \emph{\pkg{stringi} Package homepage}, \url{https://stringi.gagolewski.com/} #' diff --git a/devel/sphinx/_build/doctrees/environment.pickle b/devel/sphinx/_build/doctrees/environment.pickle index b242c871a..a3bd0a1cf 100644 Binary files a/devel/sphinx/_build/doctrees/environment.pickle and b/devel/sphinx/_build/doctrees/environment.pickle differ diff --git a/devel/sphinx/_build/doctrees/news.doctree b/devel/sphinx/_build/doctrees/news.doctree index 42103a318..dc2f5dd84 100644 Binary files a/devel/sphinx/_build/doctrees/news.doctree and b/devel/sphinx/_build/doctrees/news.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi.doctree b/devel/sphinx/_build/doctrees/rapi.doctree index 0886736a4..59ecdd5f3 100644 Binary files a/devel/sphinx/_build/doctrees/rapi.doctree and b/devel/sphinx/_build/doctrees/rapi.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/about_encoding.doctree b/devel/sphinx/_build/doctrees/rapi/about_encoding.doctree index c3459ee01..696d07319 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/about_encoding.doctree and b/devel/sphinx/_build/doctrees/rapi/about_encoding.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/about_locale.doctree b/devel/sphinx/_build/doctrees/rapi/about_locale.doctree index 54f26015b..47a2a0c9e 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/about_locale.doctree and b/devel/sphinx/_build/doctrees/rapi/about_locale.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/about_search_boundaries.doctree b/devel/sphinx/_build/doctrees/rapi/about_search_boundaries.doctree index 2969ad5f3..9f0e16193 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/about_search_boundaries.doctree and b/devel/sphinx/_build/doctrees/rapi/about_search_boundaries.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/about_search_coll.doctree b/devel/sphinx/_build/doctrees/rapi/about_search_coll.doctree index 535763a6a..b19cea118 100644 Binary files 
a/devel/sphinx/_build/doctrees/rapi/about_search_coll.doctree and b/devel/sphinx/_build/doctrees/rapi/about_search_coll.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/about_stringi.doctree b/devel/sphinx/_build/doctrees/rapi/about_stringi.doctree index a29fd0142..07620d229 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/about_stringi.doctree and b/devel/sphinx/_build/doctrees/rapi/about_stringi.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/operator_compare.doctree b/devel/sphinx/_build/doctrees/rapi/operator_compare.doctree index c4ed9e610..425a37fe5 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/operator_compare.doctree and b/devel/sphinx/_build/doctrees/rapi/operator_compare.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_compare.doctree b/devel/sphinx/_build/doctrees/rapi/stri_compare.doctree index 2efe3c130..e306dff5f 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_compare.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_compare.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_count_boundaries.doctree b/devel/sphinx/_build/doctrees/rapi/stri_count_boundaries.doctree index 3283e140d..8a7bfb526 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_count_boundaries.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_count_boundaries.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_duplicated.doctree b/devel/sphinx/_build/doctrees/rapi/stri_duplicated.doctree index 12db24ced..4eb23d513 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_duplicated.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_duplicated.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_enc_detect2.doctree b/devel/sphinx/_build/doctrees/rapi/stri_enc_detect2.doctree index e9b3f0701..81f8a9efa 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_enc_detect2.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_enc_detect2.doctree 
differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_extract_boundaries.doctree b/devel/sphinx/_build/doctrees/rapi/stri_extract_boundaries.doctree index f9c782dfa..02a245203 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_extract_boundaries.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_extract_boundaries.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_locate_boundaries.doctree b/devel/sphinx/_build/doctrees/rapi/stri_locate_boundaries.doctree index afdfc9217..6a0149350 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_locate_boundaries.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_locate_boundaries.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_opts_collator.doctree b/devel/sphinx/_build/doctrees/rapi/stri_opts_collator.doctree index 41d865eaa..020cfc248 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_opts_collator.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_opts_collator.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_order.doctree b/devel/sphinx/_build/doctrees/rapi/stri_order.doctree index eeba2e037..77a56e597 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_order.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_order.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_rank.doctree b/devel/sphinx/_build/doctrees/rapi/stri_rank.doctree new file mode 100644 index 000000000..c5a439a48 Binary files /dev/null and b/devel/sphinx/_build/doctrees/rapi/stri_rank.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_sort.doctree b/devel/sphinx/_build/doctrees/rapi/stri_sort.doctree index 8db4b7c50..c3836432f 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_sort.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_sort.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_sort_key.doctree b/devel/sphinx/_build/doctrees/rapi/stri_sort_key.doctree index dd13f457b..fd748cba7 100644 
Binary files a/devel/sphinx/_build/doctrees/rapi/stri_sort_key.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_sort_key.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_split_boundaries.doctree b/devel/sphinx/_build/doctrees/rapi/stri_split_boundaries.doctree index ecb645a25..571f2065e 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_split_boundaries.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_split_boundaries.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_trans_casemap.doctree b/devel/sphinx/_build/doctrees/rapi/stri_trans_casemap.doctree index 0840b73d3..ff3f69b62 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_trans_casemap.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_trans_casemap.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_unique.doctree b/devel/sphinx/_build/doctrees/rapi/stri_unique.doctree index 24380dbc2..b3ebfaeb8 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_unique.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_unique.doctree differ diff --git a/devel/sphinx/_build/doctrees/rapi/stri_wrap.doctree b/devel/sphinx/_build/doctrees/rapi/stri_wrap.doctree index 33fba1eab..739734d2a 100644 Binary files a/devel/sphinx/_build/doctrees/rapi/stri_wrap.doctree and b/devel/sphinx/_build/doctrees/rapi/stri_wrap.doctree differ diff --git a/devel/sphinx/_build/html/_sources/news.rst.txt b/devel/sphinx/_build/html/_sources/news.rst.txt index 1d1564f71..e89e51b5f 100644 --- a/devel/sphinx/_build/html/_sources/news.rst.txt +++ b/devel/sphinx/_build/html/_sources/news.rst.txt @@ -15,14 +15,20 @@ What Is New in *stringi* - …todo… #401 (update ICU4C to 69.1), The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39. 
-- …todo… #408 (stri_trans_casefold), +- [NEW FEATURE] #408: …todo… ``stri_trans_casefold()``, -- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing - ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). +- [NEW FEATURE] #421: ``stri_rank()`` ranks strings in a character + vector (e.g., for ordering data frames with regards to multiple + criteria, the ranks can be passed to ``order()``, see #219). + +- [BUGFIX] ``stri_sort_key()`` now outputs ``bytes``-encoded strings. - [BUGFIX] #415: ``locale=''`` was not equivalent to ``locale=NULL`` in ``stri_opts_collator()``. +- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing + ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). + 1.5.3 (2020-09-04) **CRAN** --------------------------- diff --git a/devel/sphinx/_build/html/_sources/rapi.rst.txt b/devel/sphinx/_build/html/_sources/rapi.rst.txt index 216e166d7..687690722 100644 --- a/devel/sphinx/_build/html/_sources/rapi.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi.rst.txt @@ -72,6 +72,7 @@ R Package *stringi* Reference rapi/stri_rand_lipsum rapi/stri_rand_shuffle rapi/stri_rand_strings + rapi/stri_rank rapi/stri_read_lines rapi/stri_read_raw rapi/stri_remove_empty diff --git a/devel/sphinx/_build/html/_sources/rapi/about_encoding.rst.txt b/devel/sphinx/_build/html/_sources/rapi/about_encoding.rst.txt index ee364b6a0..0a43a6b40 100644 --- a/devel/sphinx/_build/html/_sources/rapi/about_encoding.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/about_encoding.rst.txt @@ -43,7 +43,7 @@ Character Encodings in R Data in memory are just bytes (small integer values) – an en\ *coding* is a way to represent characters with such numbers, it is a semantic 'key' to understand a given byte sequence. For example, in ISO-8859-2 (Central European), the value 177 represents Polish “a with ogonek”, and in ISO-8859-1 (Western European), the same value denotes the “plus-minus” sign. 
Thus, a character encoding is a translation scheme: we need to communicate with R somehow, relying on how it represents strings. -Basically, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. +Overall, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. Character strings in R (internally) can be declared to be in: diff --git a/devel/sphinx/_build/html/_sources/rapi/about_locale.rst.txt b/devel/sphinx/_build/html/_sources/rapi/about_locale.rst.txt index 9257e65d1..014a69a9a 100644 --- a/devel/sphinx/_build/html/_sources/rapi/about_locale.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/about_locale.rst.txt @@ -54,6 +54,6 @@ See Also Other locale_management: `stri_locale_info() `__, `stri_locale_list() `__, `stri_locale_set() `__ -Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, 
`stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_coll `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/about_search_boundaries.rst.txt b/devel/sphinx/_build/html/_sources/rapi/about_search_boundaries.rst.txt index 8e404b39f..831b2ee74 100644 --- a/devel/sphinx/_build/html/_sources/rapi/about_search_boundaries.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/about_search_boundaries.rst.txt @@ -43,7 +43,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, 
`stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/about_search_coll.rst.txt b/devel/sphinx/_build/html/_sources/rapi/about_search_coll.rst.txt index 5514cf651..13ce9358d 100644 --- a/devel/sphinx/_build/html/_sources/rapi/about_search_coll.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/about_search_coll.rst.txt @@ -29,6 +29,6 @@ See Also Other search_coll: `about_search `__, `stri_opts_collator() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_locale `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/about_stringi.rst.txt b/devel/sphinx/_build/html/_sources/rapi/about_stringi.rst.txt index 4f891e487..a82d1573a 100644 --- a/devel/sphinx/_build/html/_sources/rapi/about_stringi.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/about_stringi.rst.txt @@ -4,7 +4,7 @@ about_stringi: THE String Processing Package Description 
~~~~~~~~~~~ -stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any “native” character encoding. +stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any native character encoding. **Keywords**: R, text processing, character strings, internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode. @@ -19,7 +19,7 @@ Manual pages on general topics: - `about_encoding `__ – character encoding issues, including information on encoding management in stringi, as well as on encoding detection and conversion. -- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, sorting, case-folding, and searching. +- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, ranking, sorting, case-folding, and searching. - `about_arguments `__ – information on how stringi treats its functions' arguments. @@ -54,7 +54,7 @@ Refer to the following: - `stri_trans_tolower `__ (among others) for case mapping, i.e., conversion to lower, UPPER, or Title Case, `stri_trans_nfc `__ (among others) for Unicode normalization, `stri_trans_char `__ for translating individual code points, and `stri_trans_general `__ for other universal yet powerful text transforms, including transliteration. 
-- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. +- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_rank `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. - `stri_split_lines `__ (among others) to split a string into text lines. @@ -69,7 +69,7 @@ Note that each man page provides many further links to other interesting facilit Author(s) ~~~~~~~~~ -Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM and others. The Unicode Character Database is due to Unicode, Inc.; see the COPYRIGHTS file for more details. +Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM, Unicode, Inc., and others. References ~~~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/operator_compare.rst.txt b/devel/sphinx/_build/html/_sources/rapi/operator_compare.rst.txt index 5aebca12e..ebcfa325c 100644 --- a/devel/sphinx/_build/html/_sources/rapi/operator_compare.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/operator_compare.rst.txt @@ -67,7 +67,7 @@ All the functions return a logical vector indicating the result of a pairwise co See Also ~~~~~~~~ -Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, 
`stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_compare.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_compare.rst.txt index ec92c611c..2da14bd78 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_compare.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_compare.rst.txt @@ -72,7 +72,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_count_boundaries.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_count_boundaries.rst.txt index cadcde0bd..308bbb4be 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_count_boundaries.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_count_boundaries.rst.txt @@ -51,7 +51,7 @@ See Also Other search_count: `about_search `__, `stri_count() `__ 
-Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_duplicated.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_duplicated.rst.txt index de02931dd..21173f55c 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_duplicated.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_duplicated.rst.txt @@ -68,7 +68,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale 
`__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_enc_detect2.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_enc_detect2.rst.txt index bf07d139d..533a7b2bc 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_enc_detect2.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_enc_detect2.rst.txt @@ -51,6 +51,6 @@ The guesses are ordered by decreasing confidence. See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other encoding_detection: `about_encoding `__, `stri_enc_detect() `__, `stri_enc_isascii() `__, `stri_enc_isutf16be() `__, `stri_enc_isutf8() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_extract_boundaries.rst.txt 
b/devel/sphinx/_build/html/_sources/rapi/stri_extract_boundaries.rst.txt index aecf953a6..4eb9875e0 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_extract_boundaries.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_extract_boundaries.rst.txt @@ -74,7 +74,7 @@ See Also Other search_extract: `about_search `__, `stri_extract_all() `__, `stri_match_all() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_locate_boundaries.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_locate_boundaries.rst.txt index 3bdc3714e..96b5e6e31 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_locate_boundaries.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_locate_boundaries.rst.txt @@ -66,7 +66,7 @@ Other search_locate: `about_search `__, `stri_locate_all() `__, `stri_sub_all() `__, `stri_sub() `__ -Other locale_sensitive: 
`%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_opts_collator.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_opts_collator.rst.txt index 85989bb7e..db1c9d606 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_opts_collator.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_opts_collator.rst.txt @@ -84,7 +84,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries 
`__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other search_coll: `about_search_coll `__, `about_search `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_order.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_order.rst.txt index 81334a958..f7e49d7c8 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_order.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_order.rst.txt @@ -33,10 +33,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intuitive behavior of lexicographic sorting on numeric inputs. +As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. +For ordering with regard to multiple criteria (such as sorting data frames by more than 1 column), see `stri_rank `__. 
+ Value ~~~~~ @@ -50,7 +52,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_rank.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_rank.rst.txt new file mode 100644 index 000000000..1f13d4df6 --- /dev/null +++ b/devel/sphinx/_build/html/_sources/rapi/stri_rank.rst.txt @@ -0,0 +1,62 @@ +stri_rank: Ranking +================== + +Description +~~~~~~~~~~~ + +This function ranks each string in a character vector according to a locale-dependent lexicographic order. It is a portable replacement for the base ``xtfrm`` function. + +Usage +~~~~~ + +.. 
code-block:: r + + stri_rank(str, ..., opts_collator = NULL) + +Arguments +~~~~~~~~~ + ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``str`` | a character vector | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``...`` | additional settings for ``opts_collator`` | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``opts_collator`` | a named list with ICU Collator's options, see `stri_opts_collator `__, ``NULL`` for default collation options | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ + +Details +~~~~~~~ + +Missing values result in missing ranks and tied observations receive the same ranks (based on min). + +For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. + +Value +~~~~~ + +The result is a vector of ranks corresponding to each string in ``str``. + +References +~~~~~~~~~~ + +*Collation* - ICU User Guide, http://userguide.icu-project.org/collation + +See Also +~~~~~~~~ + +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ + +Examples +~~~~~~~~ + +.. 
code-block:: r + + stri_rank(c('hladny', 'chladny'), locale='pl_PL') + stri_rank(c('hladny', 'chladny'), locale='sk_SK') + + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10)) # lexicographic order + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE) + + # Ordering a data frame with respect to two criteria: + X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8)) + X[order(stri_rank(X$a), X$b), ] diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_sort.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_sort.rst.txt index 64c922946..bff8c070d 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_sort.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_sort.rst.txt @@ -4,7 +4,7 @@ stri_sort: Sorting Description ~~~~~~~~~~~ -This function sorts a character vector according to the locale-dependent lexicographic order. +This function sorts a character vector according to a locale-dependent lexicographic order. Usage ~~~~~ @@ -33,7 +33,7 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intitive behavior of lexicographic sorting on numeric inputs. +As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. 
@@ -50,7 +50,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_sort_key.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_sort_key.rst.txt index fb1f33588..1fa67a493 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_sort_key.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_sort_key.rst.txt @@ -4,7 +4,7 @@ stri_sort_key: Sort Keys Description ~~~~~~~~~~~ -This function computes a locale-dependent 'sort key', which is an alternative character representation of the string that, when ordered in the C locale (which orders using bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale with the ability to be locale-aware. +This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale (which orders using the underlying bytes directly), will give an equivalent ordering to the original string. 
It is useful for enhancing algorithms that sort only in the C locale (e.g., the ``strcmp`` function in libc) with the ability to be locale-aware. Usage ~~~~~ @@ -29,10 +29,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. +See also `stri_rank `__ for ranking strings within a single character vector, i.e., generating relative sort keys. + Value ~~~~~ -The result is a character vector with the same length as ``str`` that contains the sort keys. +The result is a character vector with the same length as ``str`` that contains the sort keys. The output is marked as ``bytes``-encoded. References ~~~~~~~~~~ @@ -42,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_split_boundaries.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_split_boundaries.rst.txt index 4cf25d35e..fc2367aa6 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_split_boundaries.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_split_boundaries.rst.txt @@ -60,7 +60,7 @@ See 
Also Other search_split: `about_search `__, `stri_split_lines() `__, `stri_split() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_trans_casemap.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_trans_casemap.rst.txt index 0171d7399..54b76c9f1 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_trans_casemap.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_trans_casemap.rst.txt @@ -60,7 +60,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, 
`stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ Other transform: `stri_trans_char() `__, `stri_trans_general() `__, `stri_trans_list() `__, `stri_trans_nfc() `__ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_unique.rst.txt b/devel/sphinx/_build/html/_sources/rapi/stri_unique.rst.txt index ea6906c9c..7feb971ae 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_unique.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_unique.rst.txt @@ -44,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/_build/html/_sources/rapi/stri_wrap.rst.txt 
b/devel/sphinx/_build/html/_sources/rapi/stri_wrap.rst.txt index 1ffd8a838..25e4d7fea 100644 --- a/devel/sphinx/_build/html/_sources/rapi/stri_wrap.rst.txt +++ b/devel/sphinx/_build/html/_sources/rapi/stri_wrap.rst.txt @@ -84,7 +84,7 @@ D.E. Knuth, M.F. Plass, Breaking paragraphs into lines, *Software: Practice and See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__ diff --git a/devel/sphinx/_build/html/index.html b/devel/sphinx/_build/html/index.html index 688ec3cda..56df7130b 100644 --- a/devel/sphinx/_build/html/index.html +++ b/devel/sphinx/_build/html/index.html @@ -301,6 +301,7 @@

stringi: THE String Processing Package for Rstri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/news.html b/devel/sphinx/_build/html/news.html index 7b5df2542..3e3dad245 100644 --- a/devel/sphinx/_build/html/news.html +++ b/devel/sphinx/_build/html/news.html @@ -234,11 +234,15 @@

    1.6.1 (2021-XX-YY) develhttps://stringi.gagolewski.com/_static/vignette/stringi.pdf

  • …todo… #401 (update ICU4C to 69.1), The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39.

  • -
  • …todo… #408 (stri_trans_casefold),

  • -
  • [INTERNAL] #414: Use LEVELS(x) macro instead of accessing -(x)->sxpinfo.gp directly (@lukaszdaniel).

  • +
  • [NEW FEATURE] #408: …todo… stri_trans_casefold(),

  • +
  • [NEW FEATURE] #421: stri_rank() ranks strings in a character +vector (e.g., for ordering data frames with regard to multiple +criteria, the ranks can be passed to order(), see #219).

  • +
  • [BUGFIX] stri_sort_key() now outputs bytes-encoded strings.

  • [BUGFIX] #415: locale='' was not equivalent to locale=NULL in stri_opts_collator().

  • +
  • [INTERNAL] #414: Use LEVELS(x) macro instead of accessing +(x)->sxpinfo.gp directly (@lukaszdaniel).

  • diff --git a/devel/sphinx/_build/html/objects.inv b/devel/sphinx/_build/html/objects.inv index ec7322b13..75b0d3775 100644 Binary files a/devel/sphinx/_build/html/objects.inv and b/devel/sphinx/_build/html/objects.inv differ diff --git a/devel/sphinx/_build/html/rapi.html b/devel/sphinx/_build/html/rapi.html index 6c33557b5..e66b02496 100644 --- a/devel/sphinx/_build/html/rapi.html +++ b/devel/sphinx/_build/html/rapi.html @@ -167,6 +167,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -356,6 +357,7 @@

    R Package stringi Referencestri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_arguments.html b/devel/sphinx/_build/html/rapi/about_arguments.html index 137a863c2..99bfa14dd 100644 --- a/devel/sphinx/_build/html/rapi/about_arguments.html +++ b/devel/sphinx/_build/html/rapi/about_arguments.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_encoding.html b/devel/sphinx/_build/html/rapi/about_encoding.html index c954301ef..8d00c4d62 100644 --- a/devel/sphinx/_build/html/rapi/about_encoding.html +++ b/devel/sphinx/_build/html/rapi/about_encoding.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -326,7 +327,7 @@

    UTF-8 and UTF-16

    Character Encodings in R

    Data in memory are just bytes (small integer values) – an encoding is a way to represent characters with such numbers, it is a semantic ‘key’ to understand a given byte sequence. For example, in ISO-8859-2 (Central European), the value 177 represents Polish “a with ogonek”, and in ISO-8859-1 (Western European), the same value denotes the “plus-minus” sign. Thus, a character encoding is a translation scheme: we need to communicate with R somehow, relying on how it represents strings.

    -

    Basically, R has a very simple encoding marking mechanism, see stri_enc_mark. There is an implicit assumption that your platform’s default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU’s initialization and each time when you change it manually by calling stri_enc_set.

    +

    Overall, R has a very simple encoding marking mechanism, see stri_enc_mark. There is an implicit assumption that your platform’s default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU’s initialization and each time when you change it manually by calling stri_enc_set.

    Character strings in R (internally) can be declared to be in:

    diff --git a/devel/sphinx/_build/html/rapi/about_search.html b/devel/sphinx/_build/html/rapi/about_search.html index b8ec0646b..4629564b4 100644 --- a/devel/sphinx/_build/html/rapi/about_search.html +++ b/devel/sphinx/_build/html/rapi/about_search.html @@ -172,6 +172,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_search_boundaries.html b/devel/sphinx/_build/html/rapi/about_search_boundaries.html index c81859a70..01343a95d 100644 --- a/devel/sphinx/_build/html/rapi/about_search_boundaries.html +++ b/devel/sphinx/_build/html/rapi/about_search_boundaries.html @@ -173,6 +173,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -324,7 +325,7 @@

    References

    See Also

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Other text_boundaries: about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_trans_tolower(), stri_wrap()

    Other stringi_general_topics: about_arguments, about_encoding, about_locale, about_search_charclass, about_search_coll, about_search_fixed, about_search_regex, about_search, about_stringi

    diff --git a/devel/sphinx/_build/html/rapi/about_search_charclass.html b/devel/sphinx/_build/html/rapi/about_search_charclass.html index c78258e28..d10504e8a 100644 --- a/devel/sphinx/_build/html/rapi/about_search_charclass.html +++ b/devel/sphinx/_build/html/rapi/about_search_charclass.html @@ -178,6 +178,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_search_coll.html b/devel/sphinx/_build/html/rapi/about_search_coll.html index 184c5989e..3edd82397 100644 --- a/devel/sphinx/_build/html/rapi/about_search_coll.html +++ b/devel/sphinx/_build/html/rapi/about_search_coll.html @@ -173,6 +173,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -315,7 +316,7 @@

    References

    See Also

    Other search_coll: about_search, stri_opts_collator()

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Other stringi_general_topics: about_arguments, about_encoding, about_locale, about_search_boundaries, about_search_charclass, about_search_fixed, about_search_regex, about_search, about_stringi

    diff --git a/devel/sphinx/_build/html/rapi/about_search_fixed.html b/devel/sphinx/_build/html/rapi/about_search_fixed.html index 622e0836a..60be5ab97 100644 --- a/devel/sphinx/_build/html/rapi/about_search_fixed.html +++ b/devel/sphinx/_build/html/rapi/about_search_fixed.html @@ -172,6 +172,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_search_regex.html b/devel/sphinx/_build/html/rapi/about_search_regex.html index 602233e0a..28e4bdc18 100644 --- a/devel/sphinx/_build/html/rapi/about_search_regex.html +++ b/devel/sphinx/_build/html/rapi/about_search_regex.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/about_stringi.html b/devel/sphinx/_build/html/rapi/about_stringi.html index 5f6ea8796..43dea5d37 100644 --- a/devel/sphinx/_build/html/rapi/about_stringi.html +++ b/devel/sphinx/_build/html/rapi/about_stringi.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -298,7 +299,7 @@

    about_stringi: THE String Processing Package

    Description

    -

    stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any “native” character encoding.

    +

    stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any native character encoding.

    Keywords: R, text processing, character strings, internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode.

    Homepage: https://stringi.gagolewski.com/

    License: The BSD-3-clause license for the package code, the ICU license for the accompanying ICU4C distribution, and the UCD license for the Unicode Character Database. See the COPYRIGHTS and LICENSE file for more details.

    @@ -308,7 +309,7 @@

    Details
  • about_encoding – character encoding issues, including information on encoding management in stringi, as well as on encoding detection and conversion.

  • -
  • about_locale – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see stri_opts_collator for a description of the string collation algorithm, which is used for string comparing, ordering, sorting, case-folding, and searching.

  • +
  • about_locale – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see stri_opts_collator for a description of the string collation algorithm, which is used for string comparing, ordering, ranking, sorting, case-folding, and searching.

  • about_arguments – information on how stringi treats its functions’ arguments.

  • @@ -332,7 +333,7 @@

    Facilities available

    stri_length (among others) for determining the number of code points in a string. See also stri_count_boundaries for counting the number of Unicode characters and stri_width for approximating the width of a string.

  • stri_trim (among others) for trimming characters from the beginning or/and end of a string, see also about_search_charclass, and stri_pad for padding strings so that they are of the same width. Additionally, stri_wrap wraps text into lines.

  • stri_trans_tolower (among others) for case mapping, i.e., conversion to lower, UPPER, or Title Case, stri_trans_nfc (among others) for Unicode normalization, stri_trans_char for translating individual code points, and stri_trans_general for other universal yet powerful text transforms, including transliteration.

  • -
  • stri_cmp, %s<%, stri_order, stri_sort, stri_unique, and stri_duplicated for collation-based, locale-aware operations, see also about_locale.

  • +
  • stri_cmp, %s<%, stri_order, stri_sort, stri_rank, stri_unique, and stri_duplicated for collation-based, locale-aware operations, see also about_locale.

  • stri_split_lines (among others) to split a string into text lines.

  • stri_escape_unicode (among others) for escaping some code points.

  • stri_rand_strings, stri_rand_shuffle, and stri_rand_lipsum for generating (pseudo)random strings.

  • @@ -342,7 +343,7 @@

    Facilities available

    Author(s)

    -

    Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM and others. The Unicode Character Database is due to Unicode, Inc.; see the COPYRIGHTS file for more details.

    +

    Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM, Unicode, Inc., and others.

    References

    diff --git a/devel/sphinx/_build/html/rapi/operator_add.html b/devel/sphinx/_build/html/rapi/operator_add.html index 7b22ea77a..fe6b403a5 100644 --- a/devel/sphinx/_build/html/rapi/operator_add.html +++ b/devel/sphinx/_build/html/rapi/operator_add.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/operator_compare.html b/devel/sphinx/_build/html/rapi/operator_compare.html index 1529bec5f..ffeb58fa8 100644 --- a/devel/sphinx/_build/html/rapi/operator_compare.html +++ b/devel/sphinx/_build/html/rapi/operator_compare.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -363,7 +364,7 @@

    Value

    Examples

    diff --git a/devel/sphinx/_build/html/rapi/operator_dollar.html b/devel/sphinx/_build/html/rapi/operator_dollar.html index f649c5455..7c549dc0b 100644 --- a/devel/sphinx/_build/html/rapi/operator_dollar.html +++ b/devel/sphinx/_build/html/rapi/operator_dollar.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_compare.html b/devel/sphinx/_build/html/rapi/stri_compare.html index a6786bb6e..7e40bf7eb 100644 --- a/devel/sphinx/_build/html/rapi/stri_compare.html +++ b/devel/sphinx/_build/html/rapi/stri_compare.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -366,7 +367,7 @@

    References

    See Also

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Examples

    diff --git a/devel/sphinx/_build/html/rapi/stri_count.html b/devel/sphinx/_build/html/rapi/stri_count.html index 04088f1e6..e4173d497 100644 --- a/devel/sphinx/_build/html/rapi/stri_count.html +++ b/devel/sphinx/_build/html/rapi/stri_count.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_count_boundaries.html b/devel/sphinx/_build/html/rapi/stri_count_boundaries.html index 35da577a7..1e067cd88 100644 --- a/devel/sphinx/_build/html/rapi/stri_count_boundaries.html +++ b/devel/sphinx/_build/html/rapi/stri_count_boundaries.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -347,7 +348,7 @@

    Value
    diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_add.html b/devel/sphinx/_build/html/rapi/stri_datetime_add.html index c02323227..c4bc03f83 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_add.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_add.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_create.html b/devel/sphinx/_build/html/rapi/stri_datetime_create.html index eca18525b..ced2991b1 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_create.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_create.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_fields.html b/devel/sphinx/_build/html/rapi/stri_datetime_fields.html index 47b59136d..28cd824dd 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_fields.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_fields.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_format.html b/devel/sphinx/_build/html/rapi/stri_datetime_format.html index 464dffaab..d94cd8338 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_format.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_format.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_fstr.html b/devel/sphinx/_build/html/rapi/stri_datetime_fstr.html index 9790c6fc6..e9cde107a 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_fstr.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_fstr.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_now.html b/devel/sphinx/_build/html/rapi/stri_datetime_now.html index d7619955d..01cc34988 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_now.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_now.html @@ -174,6 +174,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_datetime_symbols.html b/devel/sphinx/_build/html/rapi/stri_datetime_symbols.html index f48a836bd..35fba4bda 100644 --- a/devel/sphinx/_build/html/rapi/stri_datetime_symbols.html +++ b/devel/sphinx/_build/html/rapi/stri_datetime_symbols.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_detect.html b/devel/sphinx/_build/html/rapi/stri_detect.html index 4d7c4241d..acbd039cb 100644 --- a/devel/sphinx/_build/html/rapi/stri_detect.html +++ b/devel/sphinx/_build/html/rapi/stri_detect.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_dup.html b/devel/sphinx/_build/html/rapi/stri_dup.html index fa63ddf18..3e7617307 100644 --- a/devel/sphinx/_build/html/rapi/stri_dup.html +++ b/devel/sphinx/_build/html/rapi/stri_dup.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_duplicated.html b/devel/sphinx/_build/html/rapi/stri_duplicated.html index 21f5f58f5..3dd0db54a 100644 --- a/devel/sphinx/_build/html/rapi/stri_duplicated.html +++ b/devel/sphinx/_build/html/rapi/stri_duplicated.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -366,7 +367,7 @@

    References

    See Also

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Examples

    diff --git a/devel/sphinx/_build/html/rapi/stri_enc_detect.html b/devel/sphinx/_build/html/rapi/stri_enc_detect.html index bbcc68e67..62f6f0ec5 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_detect.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_detect.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_detect2.html b/devel/sphinx/_build/html/rapi/stri_enc_detect2.html index 053083895..4a886fc84 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_detect2.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_detect2.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -343,7 +344,7 @@

    Value

    diff --git a/devel/sphinx/_build/html/rapi/stri_enc_fromutf32.html b/devel/sphinx/_build/html/rapi/stri_enc_fromutf32.html index 097e69ad3..51b45ce4a 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_fromutf32.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_fromutf32.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_info.html b/devel/sphinx/_build/html/rapi/stri_enc_info.html index ce5bf2e52..fce5a0ce0 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_info.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_info.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_isascii.html b/devel/sphinx/_build/html/rapi/stri_enc_isascii.html index b09a58570..53ecfbc01 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_isascii.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_isascii.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_isutf16.html b/devel/sphinx/_build/html/rapi/stri_enc_isutf16.html index 49cdc0163..2ac558345 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_isutf16.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_isutf16.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_isutf8.html b/devel/sphinx/_build/html/rapi/stri_enc_isutf8.html index 4831b3919..e596cec78 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_isutf8.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_isutf8.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_list.html b/devel/sphinx/_build/html/rapi/stri_enc_list.html index e09673e29..96013b309 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_list.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_list.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_mark.html b/devel/sphinx/_build/html/rapi/stri_enc_mark.html index 1f55d8973..77c4c15d9 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_mark.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_mark.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_set.html b/devel/sphinx/_build/html/rapi/stri_enc_set.html index 237e23ddd..bf5b266df 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_set.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_set.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_toascii.html b/devel/sphinx/_build/html/rapi/stri_enc_toascii.html index bc4f73506..480ad9cbf 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_toascii.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_toascii.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_tonative.html b/devel/sphinx/_build/html/rapi/stri_enc_tonative.html index 40aee40ff..66f569785 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_tonative.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_tonative.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_toutf32.html b/devel/sphinx/_build/html/rapi/stri_enc_toutf32.html index 51f2b5146..1bcf418ba 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_toutf32.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_toutf32.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_enc_toutf8.html b/devel/sphinx/_build/html/rapi/stri_enc_toutf8.html index 250391e9e..5cbf81b03 100644 --- a/devel/sphinx/_build/html/rapi/stri_enc_toutf8.html +++ b/devel/sphinx/_build/html/rapi/stri_enc_toutf8.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_encode.html b/devel/sphinx/_build/html/rapi/stri_encode.html index 577fbf20d..48d118afc 100644 --- a/devel/sphinx/_build/html/rapi/stri_encode.html +++ b/devel/sphinx/_build/html/rapi/stri_encode.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_escape_unicode.html b/devel/sphinx/_build/html/rapi/stri_escape_unicode.html index 1009e95bf..bf04ac1e9 100644 --- a/devel/sphinx/_build/html/rapi/stri_escape_unicode.html +++ b/devel/sphinx/_build/html/rapi/stri_escape_unicode.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_extract.html b/devel/sphinx/_build/html/rapi/stri_extract.html index 55386de46..f9e5b5528 100644 --- a/devel/sphinx/_build/html/rapi/stri_extract.html +++ b/devel/sphinx/_build/html/rapi/stri_extract.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_extract_boundaries.html b/devel/sphinx/_build/html/rapi/stri_extract_boundaries.html index 004c856fa..b31b065b3 100644 --- a/devel/sphinx/_build/html/rapi/stri_extract_boundaries.html +++ b/devel/sphinx/_build/html/rapi/stri_extract_boundaries.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -372,7 +373,7 @@

    Value
    diff --git a/devel/sphinx/_build/html/rapi/stri_flatten.html b/devel/sphinx/_build/html/rapi/stri_flatten.html index 1081d15aa..d27338776 100644 --- a/devel/sphinx/_build/html/rapi/stri_flatten.html +++ b/devel/sphinx/_build/html/rapi/stri_flatten.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_info.html b/devel/sphinx/_build/html/rapi/stri_info.html index e7ac1c13c..7fbaa0f58 100644 --- a/devel/sphinx/_build/html/rapi/stri_info.html +++ b/devel/sphinx/_build/html/rapi/stri_info.html @@ -173,6 +173,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_isempty.html b/devel/sphinx/_build/html/rapi/stri_isempty.html index 8a81aa562..e19285757 100644 --- a/devel/sphinx/_build/html/rapi/stri_isempty.html +++ b/devel/sphinx/_build/html/rapi/stri_isempty.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_join.html b/devel/sphinx/_build/html/rapi/stri_join.html index 4c54a1c40..0b6e14862 100644 --- a/devel/sphinx/_build/html/rapi/stri_join.html +++ b/devel/sphinx/_build/html/rapi/stri_join.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_join_list.html b/devel/sphinx/_build/html/rapi/stri_join_list.html index 241915e66..247ab31d2 100644 --- a/devel/sphinx/_build/html/rapi/stri_join_list.html +++ b/devel/sphinx/_build/html/rapi/stri_join_list.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_length.html b/devel/sphinx/_build/html/rapi/stri_length.html index 7d895ba7f..024276cda 100644 --- a/devel/sphinx/_build/html/rapi/stri_length.html +++ b/devel/sphinx/_build/html/rapi/stri_length.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_list2matrix.html b/devel/sphinx/_build/html/rapi/stri_list2matrix.html index 42ad87dc5..30decfca4 100644 --- a/devel/sphinx/_build/html/rapi/stri_list2matrix.html +++ b/devel/sphinx/_build/html/rapi/stri_list2matrix.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_locale_info.html b/devel/sphinx/_build/html/rapi/stri_locale_info.html index 3b7c1a431..efe29be22 100644 --- a/devel/sphinx/_build/html/rapi/stri_locale_info.html +++ b/devel/sphinx/_build/html/rapi/stri_locale_info.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_locale_list.html b/devel/sphinx/_build/html/rapi/stri_locale_list.html index d37a6385f..46dc9f2f3 100644 --- a/devel/sphinx/_build/html/rapi/stri_locale_list.html +++ b/devel/sphinx/_build/html/rapi/stri_locale_list.html @@ -174,6 +174,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_locale_set.html b/devel/sphinx/_build/html/rapi/stri_locale_set.html index dc839f488..20ffe2cbf 100644 --- a/devel/sphinx/_build/html/rapi/stri_locale_set.html +++ b/devel/sphinx/_build/html/rapi/stri_locale_set.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_locate.html b/devel/sphinx/_build/html/rapi/stri_locate.html index c14ae0c37..931e5e1e1 100644 --- a/devel/sphinx/_build/html/rapi/stri_locate.html +++ b/devel/sphinx/_build/html/rapi/stri_locate.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_locate_boundaries.html b/devel/sphinx/_build/html/rapi/stri_locate_boundaries.html index b11188328..220095c62 100644 --- a/devel/sphinx/_build/html/rapi/stri_locate_boundaries.html +++ b/devel/sphinx/_build/html/rapi/stri_locate_boundaries.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -363,7 +364,7 @@

    Value

    See Also

    Other search_locate: about_search, stri_locate_all()

    Other indexing: stri_locate_all(), stri_sub_all(), stri_sub()

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_trans_tolower(), stri_wrap()

    diff --git a/devel/sphinx/_build/html/rapi/stri_match.html b/devel/sphinx/_build/html/rapi/stri_match.html index 3db8d43d5..d41dacd94 100644 --- a/devel/sphinx/_build/html/rapi/stri_match.html +++ b/devel/sphinx/_build/html/rapi/stri_match.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_na2empty.html b/devel/sphinx/_build/html/rapi/stri_na2empty.html index a34448b78..802599dc0 100644 --- a/devel/sphinx/_build/html/rapi/stri_na2empty.html +++ b/devel/sphinx/_build/html/rapi/stri_na2empty.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_numbytes.html b/devel/sphinx/_build/html/rapi/stri_numbytes.html index ceb98ac0c..48d6a0289 100644 --- a/devel/sphinx/_build/html/rapi/stri_numbytes.html +++ b/devel/sphinx/_build/html/rapi/stri_numbytes.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_opts_brkiter.html b/devel/sphinx/_build/html/rapi/stri_opts_brkiter.html index 2ea5d2b0b..8e4af294b 100644 --- a/devel/sphinx/_build/html/rapi/stri_opts_brkiter.html +++ b/devel/sphinx/_build/html/rapi/stri_opts_brkiter.html @@ -176,6 +176,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_opts_collator.html b/devel/sphinx/_build/html/rapi/stri_opts_collator.html index b1f83f1c5..c6dc0d66c 100644 --- a/devel/sphinx/_build/html/rapi/stri_opts_collator.html +++ b/devel/sphinx/_build/html/rapi/stri_opts_collator.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -389,7 +390,7 @@

    References

    See Also

    -

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    +

    Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

    Other search_coll: about_search_coll, about_search

    diff --git a/devel/sphinx/_build/html/rapi/stri_opts_fixed.html b/devel/sphinx/_build/html/rapi/stri_opts_fixed.html index bc3d4ceca..d1e63d7e8 100644 --- a/devel/sphinx/_build/html/rapi/stri_opts_fixed.html +++ b/devel/sphinx/_build/html/rapi/stri_opts_fixed.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_opts_regex.html b/devel/sphinx/_build/html/rapi/stri_opts_regex.html index 37264b316..ce99b5fce 100644 --- a/devel/sphinx/_build/html/rapi/stri_opts_regex.html +++ b/devel/sphinx/_build/html/rapi/stri_opts_regex.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_order.html b/devel/sphinx/_build/html/rapi/stri_order.html index 248de7ba5..f5e3b6250 100644 --- a/devel/sphinx/_build/html/rapi/stri_order.html +++ b/devel/sphinx/_build/html/rapi/stri_order.html @@ -177,6 +177,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -337,8 +338,9 @@

    Arguments

    Details

    For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

    -

    As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intuitive behavior of lexicographic sorting on numeric inputs.

    +

    As usual in stringi, non-character inputs are coerced to strings; see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs.

    This function uses a stable sort algorithm (STL’s stable_sort), which performs up to N*log^2(N) element comparisons, where N is the length of str.

    +

    For ordering with regard to multiple criteria (such as sorting data frames by more than 1 column), see stri_rank.

    Examples

    diff --git a/devel/sphinx/_build/html/rapi/stri_pad.html b/devel/sphinx/_build/html/rapi/stri_pad.html index 1b327f1b6..6073303d3 100644 --- a/devel/sphinx/_build/html/rapi/stri_pad.html +++ b/devel/sphinx/_build/html/rapi/stri_pad.html @@ -175,6 +175,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_rand_lipsum.html b/devel/sphinx/_build/html/rapi/stri_rand_lipsum.html index df5fce3c3..108dd0f1b 100644 --- a/devel/sphinx/_build/html/rapi/stri_rand_lipsum.html +++ b/devel/sphinx/_build/html/rapi/stri_rand_lipsum.html @@ -176,6 +176,7 @@
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_rand_shuffle.html b/devel/sphinx/_build/html/rapi/stri_rand_shuffle.html index 66f813899..df65684da 100644 --- a/devel/sphinx/_build/html/rapi/stri_rand_shuffle.html +++ b/devel/sphinx/_build/html/rapi/stri_rand_shuffle.html @@ -176,6 +176,7 @@
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/devel/sphinx/_build/html/rapi/stri_rand_strings.html b/devel/sphinx/_build/html/rapi/stri_rand_strings.html index 82e123588..69f4807ee 100644 --- a/devel/sphinx/_build/html/rapi/stri_rand_strings.html +++ b/devel/sphinx/_build/html/rapi/stri_rand_strings.html @@ -41,7 +41,7 @@ - + @@ -176,6 +176,7 @@
  • Examples
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -283,7 +284,7 @@ diff --git a/devel/sphinx/_build/html/rapi/stri_rank.html b/devel/sphinx/_build/html/rapi/stri_rank.html new file mode 100644 index 000000000..33ad57ba0 --- /dev/null +++ b/devel/sphinx/_build/html/rapi/stri_rank.html @@ -0,0 +1,413 @@ + + + + + + + + + + stri_rank: Ranking — stringi 1.5.4 documentation + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
    + + + +
    + + + + + +
    + +
    + + + + + + + + + + + + + + + + + + + +
    + + + + + + +
    +
    +
    +
    + +
    +

    stri_rank: Ranking

    +
    +

    Description

    +

    This function ranks each string in a character vector according to a locale-dependent lexicographic order. It is a portable replacement for the base xtfrm function.

    +
    +
    +

    Usage

    +
    stri_rank(str, ..., opts_collator = NULL)
    +
    +
    +
    +
    +

    Arguments

    + ++++ + + + + + + + + + + + +

    str

    a character vector

    ...

    additional settings for opts_collator

    opts_collator

    a named list with ICU Collator’s options, see stri_opts_collator, NULL for default collation options

    +
    +
    +

    Details

    +

    Missing values result in missing ranks and tied observations receive the same ranks (based on min).

    +

    For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

    +
    +
    +

    Value

    +

    The result is a vector of ranks corresponding to each string in str.

    +
    +
    +

    References

    +

    Collation - ICU User Guide, http://userguide.icu-project.org/collation

    +
    + +
    +

    Examples

    +
    stri_rank(c('hladny', 'chladny'), locale='pl_PL')
    +stri_rank(c('hladny', 'chladny'), locale='sk_SK')
    +
    +stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10))  # lexicographic order
    +stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE)
    +
    +# Ordering a data frame with respect to two criteria:
    +X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8))
    +X[order(stri_rank(X$a), X$b), ]
    +
    +
    +
    +
    + + +
    + +
    + +
    +
    + +
    + +
    + + + + + + + + + + + \ No newline at end of file diff --git a/devel/sphinx/_build/html/rapi/stri_read_lines.html b/devel/sphinx/_build/html/rapi/stri_read_lines.html index f621c4185..0e94d653b 100644 --- a/devel/sphinx/_build/html/rapi/stri_read_lines.html +++ b/devel/sphinx/_build/html/rapi/stri_read_lines.html @@ -42,7 +42,7 @@ - + @@ -167,6 +167,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • @@ -352,7 +353,7 @@

    See Also - +
    diff --git a/devel/sphinx/_build/html/rapi/stri_read_raw.html b/devel/sphinx/_build/html/rapi/stri_read_raw.html index 8e9d123de..200a616d7 100644 --- a/devel/sphinx/_build/html/rapi/stri_read_raw.html +++ b/devel/sphinx/_build/html/rapi/stri_read_raw.html @@ -167,6 +167,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
    • Description
    • diff --git a/devel/sphinx/_build/html/rapi/stri_remove_empty.html b/devel/sphinx/_build/html/rapi/stri_remove_empty.html index 1c6194a73..d678a2763 100644 --- a/devel/sphinx/_build/html/rapi/stri_remove_empty.html +++ b/devel/sphinx/_build/html/rapi/stri_remove_empty.html @@ -167,6 +167,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
        diff --git a/devel/sphinx/_build/html/rapi/stri_replace.html b/devel/sphinx/_build/html/rapi/stri_replace.html index 8122059f5..f6a1f038e 100644 --- a/devel/sphinx/_build/html/rapi/stri_replace.html +++ b/devel/sphinx/_build/html/rapi/stri_replace.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_replace_na.html b/devel/sphinx/_build/html/rapi/stri_replace_na.html index 0e13617b8..cf5d00a98 100644 --- a/devel/sphinx/_build/html/rapi/stri_replace_na.html +++ b/devel/sphinx/_build/html/rapi/stri_replace_na.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_reverse.html b/devel/sphinx/_build/html/rapi/stri_reverse.html index d513674e2..8623eb78f 100644 --- a/devel/sphinx/_build/html/rapi/stri_reverse.html +++ b/devel/sphinx/_build/html/rapi/stri_reverse.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_sort.html b/devel/sphinx/_build/html/rapi/stri_sort.html index e4206baab..0ea743e6e 100644 --- a/devel/sphinx/_build/html/rapi/stri_sort.html +++ b/devel/sphinx/_build/html/rapi/stri_sort.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -300,7 +301,7 @@

        stri_sort: Sorting

        Description

        -

        This function sorts a character vector according to the locale-dependent lexicographic order.

        +

        This function sorts a character vector according to a locale-dependent lexicographic order.

        Usage

        @@ -337,7 +338,7 @@

        Arguments

        Details

        For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

        -

        As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intitive behavior of lexicographic sorting on numeric inputs.

        +

        As usual in stringi, non-character inputs are coerced to strings; see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs.

        This function uses a stable sort algorithm (STL’s stable_sort), which performs up to N*log^2(N) element comparisons, where N is the length of str.

        Examples

        diff --git a/devel/sphinx/_build/html/rapi/stri_sort_key.html b/devel/sphinx/_build/html/rapi/stri_sort_key.html index ea24498b3..c2ca1c21b 100644 --- a/devel/sphinx/_build/html/rapi/stri_sort_key.html +++ b/devel/sphinx/_build/html/rapi/stri_sort_key.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -300,7 +301,7 @@

        stri_sort_key: Sort Keys

        Description

        -

        This function computes a locale-dependent ‘sort key’, which is an alternative character representation of the string that, when ordered in the C locale (which orders using bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale with the ability to be locale-aware.

        +

        This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale (which orders using the underlying bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale (e.g., the strcmp function in libc) with the ability to be locale-aware.

        Usage

        @@ -331,10 +332,11 @@

        Arguments

        Details

        For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

        +

        See also stri_rank for ranking strings within a single character vector, i.e., generating relative sort keys.

        Value

        -

        The result is a character vector with the same length as str that contains the sort keys.

        +

        The result is a character vector with the same length as str that contains the sort keys. The output is marked as bytes-encoded.

        Examples

        diff --git a/devel/sphinx/_build/html/rapi/stri_split.html b/devel/sphinx/_build/html/rapi/stri_split.html index 30cbdcebd..9321fb959 100644 --- a/devel/sphinx/_build/html/rapi/stri_split.html +++ b/devel/sphinx/_build/html/rapi/stri_split.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_split_boundaries.html b/devel/sphinx/_build/html/rapi/stri_split_boundaries.html index 254659a0b..51da1d774 100644 --- a/devel/sphinx/_build/html/rapi/stri_split_boundaries.html +++ b/devel/sphinx/_build/html/rapi/stri_split_boundaries.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -358,7 +359,7 @@

        Value
        diff --git a/devel/sphinx/_build/html/rapi/stri_split_lines.html b/devel/sphinx/_build/html/rapi/stri_split_lines.html index 75ac36590..e68ce334d 100644 --- a/devel/sphinx/_build/html/rapi/stri_split_lines.html +++ b/devel/sphinx/_build/html/rapi/stri_split_lines.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_startsendswith.html b/devel/sphinx/_build/html/rapi/stri_startsendswith.html index 2e0ec7824..c74edbd3b 100644 --- a/devel/sphinx/_build/html/rapi/stri_startsendswith.html +++ b/devel/sphinx/_build/html/rapi/stri_startsendswith.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_stats_general.html b/devel/sphinx/_build/html/rapi/stri_stats_general.html index 95da6a66c..c8b566b69 100644 --- a/devel/sphinx/_build/html/rapi/stri_stats_general.html +++ b/devel/sphinx/_build/html/rapi/stri_stats_general.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_stats_latex.html b/devel/sphinx/_build/html/rapi/stri_stats_latex.html index 818f90eae..1decdff26 100644 --- a/devel/sphinx/_build/html/rapi/stri_stats_latex.html +++ b/devel/sphinx/_build/html/rapi/stri_stats_latex.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_sub.html b/devel/sphinx/_build/html/rapi/stri_sub.html index a54538613..d2525df81 100644 --- a/devel/sphinx/_build/html/rapi/stri_sub.html +++ b/devel/sphinx/_build/html/rapi/stri_sub.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_sub_all.html b/devel/sphinx/_build/html/rapi/stri_sub_all.html index 335c545d7..33c26525b 100644 --- a/devel/sphinx/_build/html/rapi/stri_sub_all.html +++ b/devel/sphinx/_build/html/rapi/stri_sub_all.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_subset.html b/devel/sphinx/_build/html/rapi/stri_subset.html index dbfc78f35..d367019e8 100644 --- a/devel/sphinx/_build/html/rapi/stri_subset.html +++ b/devel/sphinx/_build/html/rapi/stri_subset.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_timezone_info.html b/devel/sphinx/_build/html/rapi/stri_timezone_info.html index 94e6558e1..4a2e4a055 100644 --- a/devel/sphinx/_build/html/rapi/stri_timezone_info.html +++ b/devel/sphinx/_build/html/rapi/stri_timezone_info.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_timezone_list.html b/devel/sphinx/_build/html/rapi/stri_timezone_list.html index 873b4cd00..4172bf590 100644 --- a/devel/sphinx/_build/html/rapi/stri_timezone_list.html +++ b/devel/sphinx/_build/html/rapi/stri_timezone_list.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_timezone_set.html b/devel/sphinx/_build/html/rapi/stri_timezone_set.html index 7388286e4..178bcad31 100644 --- a/devel/sphinx/_build/html/rapi/stri_timezone_set.html +++ b/devel/sphinx/_build/html/rapi/stri_timezone_set.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_trans_casemap.html b/devel/sphinx/_build/html/rapi/stri_trans_casemap.html index c108a3f0c..b95b246d0 100644 --- a/devel/sphinx/_build/html/rapi/stri_trans_casemap.html +++ b/devel/sphinx/_build/html/rapi/stri_trans_casemap.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -357,7 +358,7 @@

        References

        See Also

        -

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_unique(), stri_wrap()

        +

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_unique(), stri_wrap()

        Other transform: stri_trans_char(), stri_trans_general(), stri_trans_list(), stri_trans_nfc()

        Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_wrap()

        diff --git a/devel/sphinx/_build/html/rapi/stri_trans_char.html b/devel/sphinx/_build/html/rapi/stri_trans_char.html index c3c1169c4..6e7abe467 100644 --- a/devel/sphinx/_build/html/rapi/stri_trans_char.html +++ b/devel/sphinx/_build/html/rapi/stri_trans_char.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_trans_general.html b/devel/sphinx/_build/html/rapi/stri_trans_general.html index 40dfcfc61..61316a009 100644 --- a/devel/sphinx/_build/html/rapi/stri_trans_general.html +++ b/devel/sphinx/_build/html/rapi/stri_trans_general.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_trans_list.html b/devel/sphinx/_build/html/rapi/stri_trans_list.html index ba0f342ad..5ebf9be1d 100644 --- a/devel/sphinx/_build/html/rapi/stri_trans_list.html +++ b/devel/sphinx/_build/html/rapi/stri_trans_list.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_trans_nf.html b/devel/sphinx/_build/html/rapi/stri_trans_nf.html index 016448178..ece7199f6 100644 --- a/devel/sphinx/_build/html/rapi/stri_trans_nf.html +++ b/devel/sphinx/_build/html/rapi/stri_trans_nf.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_trim.html b/devel/sphinx/_build/html/rapi/stri_trim.html index 9d7f20134..0720939d0 100644 --- a/devel/sphinx/_build/html/rapi/stri_trim.html +++ b/devel/sphinx/_build/html/rapi/stri_trim.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_unescape_unicode.html b/devel/sphinx/_build/html/rapi/stri_unescape_unicode.html index 9e0357bea..8e53e931b 100644 --- a/devel/sphinx/_build/html/rapi/stri_unescape_unicode.html +++ b/devel/sphinx/_build/html/rapi/stri_unescape_unicode.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_unique.html b/devel/sphinx/_build/html/rapi/stri_unique.html index 1f86b591b..ada34d95a 100644 --- a/devel/sphinx/_build/html/rapi/stri_unique.html +++ b/devel/sphinx/_build/html/rapi/stri_unique.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -343,7 +344,7 @@

        References

        See Also

        -

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_wrap()

        +

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_wrap()

        Examples

        diff --git a/devel/sphinx/_build/html/rapi/stri_width.html b/devel/sphinx/_build/html/rapi/stri_width.html index 0d10b47ac..c2288b965 100644 --- a/devel/sphinx/_build/html/rapi/stri_width.html +++ b/devel/sphinx/_build/html/rapi/stri_width.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/rapi/stri_wrap.html b/devel/sphinx/_build/html/rapi/stri_wrap.html index 44111465e..17318f94e 100644 --- a/devel/sphinx/_build/html/rapi/stri_wrap.html +++ b/devel/sphinx/_build/html/rapi/stri_wrap.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • @@ -388,7 +389,7 @@

        References

        See Also

        -

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique()

        +

        Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique()

        Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_trans_tolower()

        diff --git a/devel/sphinx/_build/html/rapi/stri_write_lines.html b/devel/sphinx/_build/html/rapi/stri_write_lines.html index 23ff4e7dc..1c9395ddc 100644 --- a/devel/sphinx/_build/html/rapi/stri_write_lines.html +++ b/devel/sphinx/_build/html/rapi/stri_write_lines.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/devel/sphinx/_build/html/searchindex.js b/devel/sphinx/_build/html/searchindex.js index ad8b44947..90b3eb05c 100644 --- a/devel/sphinx/_build/html/searchindex.js +++ b/devel/sphinx/_build/html/searchindex.js @@ -1 +1 @@ -Search.setIndex({docnames:["index","install","news","rapi","rapi/about_arguments","rapi/about_encoding","rapi/about_locale","rapi/about_search","rapi/about_search_boundaries","rapi/about_search_charclass","rapi/about_search_coll","rapi/about_search_fixed","rapi/about_search_regex","rapi/about_stringi","rapi/operator_add","rapi/operator_compare","rapi/operator_dollar","rapi/stri_compare","rapi/stri_count","rapi/stri_count_boundaries","rapi/stri_datetime_add","rapi/stri_datetime_create","rapi/stri_datetime_fields","rapi/stri_datetime_format","rapi/stri_datetime_fstr","rapi/stri_datetime_now","rapi/stri_datetime_symbols","rapi/stri_detect","rapi/stri_dup","rapi/stri_duplicated","rapi/stri_enc_detect","rapi/stri_enc_detect2","rapi/stri_enc_fromutf32","rapi/stri_enc_info","rapi/stri_enc_isascii","rapi/stri_enc_isutf16","rapi/stri_enc_isutf8","rapi/stri_enc_list","rapi/stri_enc_mark","rapi/stri_enc_set","rapi/stri_enc_toascii","rapi/stri_enc_tonative","rapi/stri_enc_toutf32","rapi/stri_enc_toutf8","rapi/stri_encode","rapi/stri_escape_unicode","rapi/stri_extract","rapi/stri_extract_boundaries","rapi/stri_flatten","rapi/stri_info","rapi/stri_isempty","rapi/stri_join","rapi/stri_join_list","rapi/stri_length","rapi/stri_list2matrix","rapi/stri_locale_info","rapi/stri_locale_list","rapi/stri_locale_set","rapi/stri_locate","rapi/stri_locate_boundaries","rapi/stri_match","rapi/stri_na2empty","rapi/stri_numbytes","rapi/stri_opts_brkiter","rapi/stri_opts_collator","rapi/stri_opts_fixed","rapi/stri_opts_regex","rapi/stri_order","rapi/stri_pad","rapi/stri_rand_lipsum","rapi/stri_rand_shuffle","rapi/stri_rand_strings","rapi/stri_read_lines","rapi/stri_read_raw","rapi/stri_remove_empty","rapi/stri_replace","rapi/stri_replace_na","rapi/stri_reverse
","rapi/stri_sort","rapi/stri_sort_key","rapi/stri_split","rapi/stri_split_boundaries","rapi/stri_split_lines","rapi/stri_startsendswith","rapi/stri_stats_general","rapi/stri_stats_latex","rapi/stri_sub","rapi/stri_sub_all","rapi/stri_subset","rapi/stri_timezone_info","rapi/stri_timezone_list","rapi/stri_timezone_set","rapi/stri_trans_casemap","rapi/stri_trans_char","rapi/stri_trans_general","rapi/stri_trans_list","rapi/stri_trans_nf","rapi/stri_trim","rapi/stri_unescape_unicode","rapi/stri_unique","rapi/stri_width","rapi/stri_wrap","rapi/stri_write_lines"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["index.rst","install.rst","news.rst","rapi.rst","rapi/about_arguments.rst","rapi/about_encoding.rst","rapi/about_locale.rst","rapi/about_search.rst","rapi/about_search_boundaries.rst","rapi/about_search_charclass.rst","rapi/about_search_coll.rst","rapi/about_search_fixed.rst","rapi/about_search_regex.rst","rapi/about_stringi.rst","rapi/operator_add.rst","rapi/operator_compare.rst","rapi/operator_dollar.rst","rapi/stri_compare.rst","rapi/stri_count.rst","rapi/stri_count_boundaries.rst","rapi/stri_datetime_add.rst","rapi/stri_datetime_create.rst","rapi/stri_datetime_fields.rst","rapi/stri_datetime_format.rst","rapi/stri_datetime_fstr.rst","rapi/stri_datetime_now.rst","rapi/stri_datetime_symbols.rst","rapi/stri_detect.rst","rapi/stri_dup.rst","rapi/stri_duplicated.rst","rapi/stri_enc_detect.rst","rapi/stri_enc_detect2.rst","rapi/stri_enc_fromutf32.rst","rapi/stri_enc_info.rst","rapi/stri_enc_isascii.rst","rapi/stri_enc_isutf16.rst","rapi/stri_enc_isutf8.rst","rapi/stri_enc_list.rst","rapi/stri_enc_mark.rst","rapi/stri_enc_set.rst","rapi/stri_enc_toascii.rst","rapi/stri_enc_tonative.rst","rapi/stri_enc_toutf32.rst","rapi/stri_enc_toutf8
.rst","rapi/stri_encode.rst","rapi/stri_escape_unicode.rst","rapi/stri_extract.rst","rapi/stri_extract_boundaries.rst","rapi/stri_flatten.rst","rapi/stri_info.rst","rapi/stri_isempty.rst","rapi/stri_join.rst","rapi/stri_join_list.rst","rapi/stri_length.rst","rapi/stri_list2matrix.rst","rapi/stri_locale_info.rst","rapi/stri_locale_list.rst","rapi/stri_locale_set.rst","rapi/stri_locate.rst","rapi/stri_locate_boundaries.rst","rapi/stri_match.rst","rapi/stri_na2empty.rst","rapi/stri_numbytes.rst","rapi/stri_opts_brkiter.rst","rapi/stri_opts_collator.rst","rapi/stri_opts_fixed.rst","rapi/stri_opts_regex.rst","rapi/stri_order.rst","rapi/stri_pad.rst","rapi/stri_rand_lipsum.rst","rapi/stri_rand_shuffle.rst","rapi/stri_rand_strings.rst","rapi/stri_read_lines.rst","rapi/stri_read_raw.rst","rapi/stri_remove_empty.rst","rapi/stri_replace.rst","rapi/stri_replace_na.rst","rapi/stri_reverse.rst","rapi/stri_sort.rst","rapi/stri_sort_key.rst","rapi/stri_split.rst","rapi/stri_split_boundaries.rst","rapi/stri_split_lines.rst","rapi/stri_startsendswith.rst","rapi/stri_stats_general.rst","rapi/stri_stats_latex.rst","rapi/stri_sub.rst","rapi/stri_sub_all.rst","rapi/stri_subset.rst","rapi/stri_timezone_info.rst","rapi/stri_timezone_list.rst","rapi/stri_timezone_set.rst","rapi/stri_trans_casemap.rst","rapi/stri_trans_char.rst","rapi/stri_trans_general.rst","rapi/stri_trans_list.rst","rapi/stri_trans_nf.rst","rapi/stri_trim.rst","rapi/stri_unescape_unicode.rst","rapi/stri_unique.rst","rapi/stri_width.rst","rapi/stri_wrap.rst","rapi/stri_write_lines.rst"],objects:{},objnames:{},objtypes:{},terms:{"0000":[5,9],"000a":66,"001a":44,"00ad":100,"0100":23,"0105":9,"0123456789":70,"032":40,"0377":12,"0530":23,"075258":23,"0800":23,"0ooo":12,"0x0a":82,"0x0b":82,"0x0c":82,"0x0d":82,"0x1a":40,"0x1f":98,"0x2028":82,"0x2029":82,"0x3000":100,"0x85":82,"0xff01":100,"0xff5e":100,"100":[2,64,67,78],"100000":30,"101":[67,78],"102":2,"105":2,"106":2,"10646":13,"107":2,"108":2,"109":2,"10ffff":[5,9],"110":2,"
111":2,"1119":101,"112":2,"114":2,"116":2,"117":2,"118":2,"1184":101,"119":2,"120":2,"122":2,"123":[2,14,18,27,47,50,51,52,53,62,75,77,81,88,92,93],"1234":75,"124":2,"1250":[30,36],"1251":30,"1252":[2,5,30],"1253":30,"1254":30,"1255":30,"1256":30,"126":2,"127":[5,34,38,40,43],"128":2,"129":2,"12l":21,"132":2,"133":2,"134":2,"135":2,"137":2,"138":2,"139":2,"141":2,"143":2,"144":2,"149":2,"154":2,"157":2,"164":2,"165":2,"168":2,"169":2,"16be":[30,31,35],"16le":[30,31,35],"170":2,"174":2,"175":2,"176":2,"177":5,"180":2,"183":2,"187":2,"188":2,"189":23,"190":69,"193":2,"1970":25,"1981":101,"199":2,"1990":9,"1996":23,"1999":[10,23],"1bc":[21,22],"1st":23,"1to1":33,"2001":2,"2002":12,"200b":100,"2013":0,"2014":[0,20],"2015":[0,21,23],"2016":[0,20],"2017":0,"2018":0,"2019":0,"2020":0,"2021":0,"2022":30,"2028":[9,82],"2029":[9,82],"205":2,"2060":9,"206f":9,"207":2,"210":2,"214":2,"216":2,"220":2,"227":2,"230":2,"231":2,"232":2,"235":23,"2350":23,"238":2,"242":2,"2451334":23,"253":2,"254":2,"258":2,"263":2,"266":2,"267":2,"270":2,"285":2,"288":2,"289":2,"296":2,"2bc":[21,22],"2nd":23,"314":2,"3166":[6,90],"317":2,"318":2,"319":2,"31t23":23,"325":2,"32be":[30,31,35],"32le":[30,31,35],"334":2,"335":2,"337":2,"338":2,"341":2,"343":2,"344":2,"345":2,"3456":[86,87],"347":2,"348":2,"355":2,"362":2,"3629":13,"363":2,"364":2,"366":2,"369":2,"370":2,"372":2,"382":2,"386":2,"393":2,"398":2,"399":2,"3rd":2,"400":2,"401":2,"405":2,"408":2,"414":2,"415":2,"456":[27,52,75,81],"4601":23,"5198":96,"55200":46,"5775":21,"61201235":23,"639":6,"667":[86,87],"789":[27,52,75,81,86,87],"822":23,"8601":23,"8859":[5,30],"8bit":33,"9899":9,"999":21,"abstract":12,"bart\u0142omiej":0,"break":[2,8,19,47,59,63,81,92,101],"byte":[0,2,3,5,7,12,13,30,31,32,33,34,35,36,38,40,41,42,43,44,53,66,79,86,98],"case":[0,1,2,3,4,5,6,7,8,9,10,11,12,13,17,19,24,27,30,31,43,44,46,47,51,53,55,59,63,64,65,66,70,75,80,81,87,94,96,101],"char":84,"class":[0,2,3,7,8,12,13,20,21,22,23,25,26,64,71,90,91,97],"default":[0,1,2,3,5
,12,15,17,18,19,20,21,22,23,26,27,29,31,33,37,38,43,44,46,47,55,58,59,60,63,64,65,66,67,68,72,75,78,79,80,81,82,83,88,89,90,92,97,99,101,102],"enum":[2,66],"export":2,"final":[5,6,9,12,100],"float":2,"function":[0,1,2,3,5,9,10,11,13,15,17,18,19,20,23,24,27,29,30,31,32,34,35,36,38,40,41,42,43,44,46,47,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,72,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,94,96,97,98,99,100,101,102],"import":[2,4],"long":[1,2,4,23,89,90],"new":[0,12,14,81,101],"null":[1,2,6,17,18,19,20,21,22,23,26,27,29,31,32,33,39,41,42,44,46,47,51,52,55,57,58,59,60,63,64,67,72,75,78,79,80,81,83,88,89,91,92,99,101,102],"public":9,"return":[2,5,7,12,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,68,69,70,71,72,73,74,75,76,77,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],"short":[1,2,9,11,23,49,89],"static":2,"strin\u0261i":0,"switch":[2,5],"throw":2,"true":[2,5,9,12,17,19,21,23,27,29,37,43,44,46,47,48,49,51,52,54,58,59,64,65,66,67,68,69,71,74,75,78,80,81,82,86,87,88,101],"try":[1,2,31],"var":1,"while":[2,5,6,8,17,39],Added:2,For:[0,1,3,4,5,6,8,9,10,12,17,19,23,24,30,32,36,37,43,44,45,46,47,53,58,59,60,62,63,66,67,75,78,79,81,83,86,87,89,91,92,94,97,98],Into:[0,3],Its:[12,36,86,87],Los:23,Mrs:[59,81],NAs:[0,3],NFs:96,Not:[30,46,57,62,75,86,91],One:6,Such:[5,29,86,87,99],Sys:[5,38,39],THE:[3,47,80],The:[0,1,2,5,6,7,8,9,10,11,12,13,17,19,20,23,25,27,30,31,34,36,37,41,48,54,58,59,60,62,63,67,69,72,75,78,79,80,81,88,90,96,98,100,101],Their:[6,12],There:5,These:[5,7,8,9,14,15,17,18,19,23,27,35,44,46,47,51,52,58,59,60,68,75,80,82,83,88,92,96,97],Use:[2,58,59],Used:89,Useful:2,Uses:98,Using:2,With:[12,55,92],_boundari:[2,7,59],_charclass:[2,7,9,83],_coll:[2,7,10,83],_count:2,_euro:6,_fix:[2,7,65,83],_limit:2,_regex:[2,7,12,58,60,75],_static:2,_word:[47,59],_xpg6:2,a_b_c__d:80,a_b_c_d:80,aaa:[23,46,58,97],aaaa:[46,58,75],aa
aaaaaa:[46,58],aabbcc:[46,58],ab_c:80,aba:46,ababa:83,abababa:46,abaca:75,abbrevi:[23,26],abc:[9,14,27,28,46,50,51,53,58,62,77,86,87,92],abcd:[60,68],abcdefghi:70,abcdefghijk:[46,58],abil:[72,79,102],abl:[2,7],about:[0,2],about_argu:[0,3,5,6,7,8,9,10,11,12,13],about_encod:[0,3,4,6,7,8,9,10,11,12,13,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44],about_local:[0,3,4,5,7,8,9,10,11,12,13,15,17,19,29,31,47,55,56,57,59,64,67,78,79,81,92,99,101],about_search:[0,3,4,5,6,8,9,10,11,12,13,18,19,27,46,47,58,59,60,63,64,65,66,75,80,81,82,83,88,92,97,101],about_search_boundari:[0,3,4,5,6,7,9,10,11,12,13,15,17,19,29,31,47,59,63,64,67,78,79,81,82,92,99,101],about_search_charclass:[0,3,4,5,6,7,8,10,11,12,13,97],about_search_col:[0,3,4,5,6,7,8,9,11,12,13,15,17,19,29,31,47,59,64,67,78,79,81,92,99,101],about_search_fix:[0,3,4,5,6,7,8,9,10,12,13,65],about_search_regex:[0,3,4,5,6,7,8,9,10,11,13,66],about_stringi:[0,3,4,5,6,7,8,9,10,11,12],abov:[9,31,54,60,64],absolut:1,ac_config_fil:2,ac_subst:2,acagagactttagatagagaaga:[58,60],accent:[9,10,11,94],accept:[2,63,88],access:[1,2,9,16,42],accompani:13,accord:[9,38,44,46,62,64,78,80,92],accordingli:2,account:[8,10,17,30,65,68,89,101],acd:9,acgt:[60,93],achiev:94,across:2,act:[2,14,35,63,68,101],action:63,activ:[5,9,62,96],actual:[11,101],add:[2,20,44,68],added:[2,68],adding:20,addit:[1,2,17,18,19,23,27,29,46,47,58,59,60,67,75,78,79,80,81,83,88,90,92,99],addition:[2,5,13,17,37,38,60],address:2,adipis:[18,75,84,85,86,101],adjac:23,adjust:97,advanc:[4,9,12,63],aesthet:101,affect:[2,80,81,94],after:[2,12,30,64],aga:[46,58,75],agaga:[46,58,75],again:[2,9],against:[1,2,30],aggreg:[84,85],agonek:77,ahead:12,aim:[2,9,19,44,72],ala:[65,66],algorithm:[2,9,10,11,13,67,78,79,85,96,101],alia:[2,17,29,44,54,64,66,69,72,73,74,75,86,87,101,102],alias:[2,9,37,51,52],align:[0,3],alik:64,aliquet:[84,101],all:[0,1,2,3,4,5,6,7,9,10,12,13,15,17,18,19,22,23,26,27,28,29,30,31,33,34,36,38,40,43,44,45,46,47,52,56,57,58,59,60,61,64,75,80,81,90,91,96,97,101,102],alloc:2,al
low:[2,5,9,10,12,17,18,21,27,32,46,58,60,66,86,101],almost:[4,5,90],alon:23,along:30,alpha:27,alphabet:[9,12],alphanumer:5,alreadi:[1,29,91],also:[0,1,2,68,77],alter:12,altern:[2,9,12,58,79,86],alternate_shift:64,alwai:[5,9,17,31,39,40,44,51,54,56,57,71,72,88,90,96,101],ambigu:5,america:23,amet:[18,52,69,75,80,84,85,86,101],among:[0,2,5,9,13,60,68],amount:[5,20,30,90],ampm:[22,26],analog:94,analysi:[0,2,3,7,12,13,19,47,59,63,81,101],angel:23,angl:[12,30],ani:[0,2,4,5,6,9,12,13,17,23,29,32,43,45,51,55,63,64,65,66,75,82,86,87,89,94,96,100],annex:[9,96,100],anno:23,anoth:[9,94],anydupl:29,anymor:2,anyth:[55,86],anywai:[1,2],apart:[5,37],api:[0,2,9,13,24,26,32,38,63,64,66,90,91],apidoc:[9,13,26,63,64,66,90,91],appear:[5,6,12,23,63,71,80,82,84,85],append:23,appli:[4,9,12,14,80,82,87,90,100,101],applic:[2,5,86,87],appreci:0,appropri:[1,8,44,46,64,80],approxim:[2,13,100],arab:30,arbitrari:[32,83,97],architectur:64,archiv:1,area:90,arg:[1,2],argument:[0,1,2,3,5,6,13],aris:96,arithmet:[0,3],arrai:2,arrang:101,asan:2,ascend:67,ascii:[0,2,3,5,9,12,23,31,33,36,38,39,43,44,45,66,71,94,98,100,101],ascii_hex_digit:9,asian:100,ask:6,assert:12,assum:[1,2,4,5,38,39,40,43,44,96],assumpt:[5,38,40],asymmetr:9,atom:[2,4,12,16,51,54],atomic_vector:16,attempt:2,attr:22,attrib:2,attribut:[2,37,64,99],augu:[84,85,101],australian:6,author:0,auto:2,autoconf:2,autom:5,automat:[5,6,9,38,44,96],avail:[0,2,3,6,7,9,12,37,46,65,66,75,89,94],avoid:[2,6,9,96],awar:[6,11,12,13,27,64,79],baaab:18,baab:18,bab:18,babaab:93,babab:18,back:[6,9,12,23,86],backslash:[9,66,75],backtrack:66,backward:[2,64],bacon:[19,52,59,60,81],bartek:13,bartolini:[46,58],base:[1,2,5,7,9,10,13,15,16,21,22,24,29,31,59,64,69,83,86,87,94,99,100,101],basic:[2,5,8,23,33,54,55,89],bastienfr:2,bbbbb:58,bear:75,becam:2,becaus:[1,2,4,6,11,14,30,31,36,44,65,72,96],becom:[1,23,80,102],been:[0,1,2,5,9,30,53,63,83,91],befor:[2,9,12,30,45,64,89,101],begin:[12,13,67,78,85,90],behavior:[4,6,8,12,43,51,63,64,65,66,67,78,90],behaviour:2,behind:[
2,12],being:[2,5,12,23,55,64,86,101],bell:12,belong:9,below:[2,4,5,8,9,12,17,23,33,46,58,64,67,75,78,84],best:[5,6,30,31],better:[5,12,29,65,70,99],between:[0,2,3,5,9,10,12,17,24,48,59,64,80,97,101],bewar:98,biarch:2,bibliograph:9,bidi:9,bidi_control:9,bidi_mirror:9,bidirect:[9,70,71,77,86],big5:30,big:[1,2,71],bin:[1,2],binari:[0,2,3,7,14,18,72,73,84,97,102],bit:[5,31,32,33,36,39,40,42,43,62,90],bitcoin:97,bitwis:11,black:75,bogu:43,bom:[2,5,17,43,44],both:[2,5,17,19,20,35,43,68,74,86,97,101],bound:[9,86],boundari:[0,2,3,7,12,13,63,66,80,92,101],boundaryanalysi:[8,63],box:[1,2],bracket:[9,12,30],breakfast:60,breakiter:[0,2,3,8,19,47,59,81,92,101],briefli:9,bring:2,british:2,broader:94,broken:2,brown:[59,75,81],bsd:[0,2,13],buddhist:26,buffer:2,bug:[0,1,2],bugfix:2,build:[0,2],built:[1,2,49,51,54,94],bundl:[1,2],by_row:54,byrow:[2,46,47,54,80,81],bytewis:[29,64,99],c90:9,calendar:[2,6,20,21,22,23,26,89],call:[0,1,2,4,5,6,11,14,15,17,18,19,27,30,41,42,43,44,46,47,48,55,57,58,59,60,72,75,80,81,83,87,88,90,94,101],cam:100,can:[0,1,2,5,8,9,30,32,38,41,43,44,70,73,87,92,94,97,101],canadian:64,cannot:[2,8,44,72,98],canon:[2,10,15,17,29,33,37,96,99],capabl:94,capit:[8,92],captur:[0,2,3,12,46,75],care:[4,86],carefulli:5,carriag:[12,82],cascad:5,case_ignor:9,case_insensit:[2,27,46,58,65,66,75],case_level:[17,64],case_map:65,case_sensit:9,casemap:92,cat:[1,5,68,69,100,101],categori:[5,7,12,18,38,39,63,97,100],caus:[2,9,43,64],cbind:[86,87],ccc:23,cccc:23,ccccc:23,cccccc:23,center:[0,3],cento:[1,2],central:5,certain:[23,45],certainli:36,cflag:1,cg_miss:[2,60],chain:[2,69,94],chang:[2,5,6,9,12,30,39,42,57,66,68,86,90,91,92,101],changes_when_casefold:9,changes_when_casemap:9,changes_when_lowercas:9,changes_when_nfkc_casefold:9,changes_when_titlecas:9,changes_when_uppercas:9,charact:[0,2,3,4,6,7,8,13,15,16,17,18,19,23,24,27,28,29,32,34,35,36,38,40,41,42,43,44,45,46,47,48,49,50,52,53,55,56,58,59,60,61,62,63,67,68,69,70,71,72,75,77,78,79,80,81,82,83,87,88,90,92,94,95,96,98,99,100,1
01,102],character_set:30,charclass:[2,9,18,27,46,58,71,75,80,83,84,88,97,100],charmod:96,charscmdenvir:85,charset:[39,49],charsiz:33,charsnwhit:84,charswhit:85,charsword:85,charsxp:2,chartr:2,check:[0,1,2,3,5,6,9,17,30,31,38,46,64,68,83],chines:[8,9,23,30],chladni:[17,67,78,79],choic:[5,23],choos:1,chunk:7,circul:6,circumst:24,citi:23,civil:6,cjkv:9,clang:2,clariti:9,classicu_1_1col:64,classicu_1_1dateformatsymbol:26,classicu_1_1timezon:[90,91],classicu_1_1unicodeset:9,classif:9,classifi:35,claus:[0,2,13],cldr:2,clean:2,clever:[17,44],clock:[22,23],close:[1,9],closer:90,cluster:12,cmd:[1,85],code:[0,2,3,5,6,8,9,12,13,15,17,19,31,32,33,40,42,43,44,59,62,64,65,68,71,77,83,84,86,90,92,93,99,101],codec:2,codepoint:96,coerc:[2,37,48,54,67,78],coercibl:[4,14,15,17,19,20,22,23,32,38,42,47,50,51,53,59,62,76,81,100],coercion:2,coexist:5,coll:[18,27,46,58,64,65,75,80,83,88],collaps:[2,4,30,48,51,52,69,70],collat:[0,2,3,6,7,10,13,29,67,78,79,99],collect:2,colour:1,column:[2,22,54,58,59,60,86,87,100],com:[1,2,13],combin:[9,12,55,94,96],come:[8,92],command:[0,1,3],comment:[12,66],common:[1,2,40,89],commonli:[9,30],commun:[5,6],compar:[0,3,5,6,12,13,29,60,62,75],comparison:[2,5,6,15,17,64,67,78],compat:[2,23,96,100,101],competit:5,compil:[1,2],complement:9,complex:[1,5,10,11,64,93,101],complic:55,compon:[13,26,31,33,49,89],composit:[94,96],compound:94,comprehens:[2,9],comput:[5,6,22,62,79],con:[2,72,73,102],concaten:[0,2,3,5,13,28],concept:6,concern:90,concis:49,conclus:0,condition:2,confid:[30,31],config:[1,2],configur:[1,2,30,86],conform:[2,12,72],confus:51,conjoin:[10,11],conjunct:2,connect:[2,9,54,72,73,102],connector_punctu:12,consectetur:[18,75,84,85,86,101],consecut:[27,46,58,75,101],consequ:[15,39],consid:[44,64],consider:5,consist:[0,2,4,5,9,13,17,24,40,47,52,60,68,69,71,92,93],consol:[5,53,68,101],conson:100,consortium:13,constant:[2,12,66],construct:[2,21],contain:[0,3,9,49,63,66,75,79,84,101],content:[13,82,96],context:[12,23,26,65,85,92],continu:9,contrari:[97,101],c
ontribut:[0,13],contributor:85,control:[2,8,9,12,64,66,67,78,83,98,100],conveni:[0,2,13,18,27,32,46,57,58,60,63,64,65,66,68,75,76,80,83,88,94,97],convent:[6,19,45,47,59,92,101],convers:[2,11,13,24,30,44,73,94],convert:[0,2,3,4,5,9,23,31,37,45,94,96],converted_str:44,cooki:92,coordin:90,copi:[1,2,4,86,87,99],coptic:26,copyright:[2,13],correct:[0,2,6,10,11,13,86],correctli:[1,2,5,39],correspond:[2,4,9,15,17,27,32,34,36,42,51,53,60,75,82,86,87,90,93],cost:[2,101],cost_expon:101,could:[2,6,30],count:[0,2,3,7,8,13,23,83,85,86],counterpart:[29,99],countri:[6,55,90],cours:[2,4,30,31,83],cover:[5,12,31],cpp:[2,31],cppflag:1,cpu:66,cra:[84,101],cran:0,creat:[0,1,3,5,14,56],crlf:82,csrucod:31,cstring:2,cultur:6,currenc:[6,9],current:[0,1,2,3,6,9,12,22,23,39,41,44,49,57,60,62,69,72,89,91,102],custom:[1,2,63],customis:0,cxx11:[1,2],cxx1x:2,cxxcpp:2,cxxflag:1,cyclic:23,cyril:[9,94],czech:30,czw:23,d_ef_g:80,dai:[20,21,22,23],danish:30,dash:[2,9],dat:2,data:[0,1,2,3,5,9,11,22,23,30,31,38,44,59,62,64,69,80,90,102],databas:[9,13],date:[0,2,3,13,24,90,91],date_long:23,dateformatsymbol:26,datetim:[20,21,22,23,24,25,26,89,90,91],datetime_relative_medium:23,davisvaughan:2,daylight:[23,89,90],dayofweek:22,dayofyear:22,de_d:[17,92],deal:[2,4,5,42,53],debian:1,debug:2,decid:5,decim:[9,12],decimal_numb:12,declar:[0,2,3,5,39,40,41,43,44],decnumb:2,decod:[32,94],decomposit:96,decreas:[30,31,67,78],def:27,default_ignorable_code_point:9,default_local:2,defin:[9,10,12,32,39,49,64,80,82,83,86,87,90,96,98],definit:[64,66],delimit:80,deliv:6,denorm:5,denot:[5,9,22,48,75,83,86,101],depend:[1,2,5,6,8,9,12,15,17,18,22,23,27,29,46,57,58,66,67,75,78,79,80,82,83,88,91,92,99,101],deprec:[0,2,3,9,29,63,64,65,66,69,72,73,102],descend:67,describ:[9,10,11,12,54],design:[2,5,23,90,94],desir:[6,66,71,76,94],dessert:60,detail:4,detect:[0,2,3,6,7,13,35,38,39,42,53,60,65,73,84],determin:[0,2,3,5,9,13,17,19,27,30,40,80,82,91,96,101],dev:[1,2,9,13,26,63,64,66,90,91],devel:[0,1],develop:[1,5,13],diacrit:[8,9,17],dia
gnos:44,diagnost:2,did:[2,6],differ:[2,5,6,8,9,12,17,18,19,30,46,48,51,58,60,66,75,92,93,94,96,97],digit:[5,9,12,13,23,45,64,71,90,98],digraph:9,dim:4,dimitri:2,dir:[1,2],directli:[2,58,79,83],directori:1,disabl:[1,2,12],disallow:[9,44],disappear:9,discourag:9,discret:69,discuss:[5,39,44,55],disjoint:87,dispatch:68,displai:[2,5,8,9,23,69],display_typ:89,distinguish:12,distribut:[1,2,13,69],divers:1,doc:[9,10,13,26,63,64,66,90,91],document:[2,8,9,13,26,63,64,66,90,91,96],doe:[1,2,5,6,8,9,12,17,23,24,33,55,60,64,90,100,101],dog:75,doing:[4,5,39],dolor:[18,52,69,75,80,84,85,86,101],domini:23,done:[11,71],dot:9,dot_al:66,dotal:66,download:[0,1,2],draft:[0,2,13,96],drastic:2,draw:71,drop:4,dst:[89,90],dt_relative_styl:23,dt_style:23,du_disable_renam:2,dual:[32,42],due:[1,4,5,13,37],dummi:[2,69],duplic:[0,2,3,37,99],dure:[6,56,80,90],dutch:30,dynam:[2,101],dynlib:2,e0000:9,e0fff:9,each:[0,2,3,4,5,6,7,8,9,13,14,18,24,27,28,29,30,31,32,37,40,42,46,47,51,52,53,54,58,60,62,68,71,72,75,76,80,82,83,84,85,86,87,92,93,94,95,96,101,102],eagerli:2,earli:2,eas:2,easier:[5,88],easili:[2,42,102],east:100,eee:23,eeee:23,eeeee:23,eeeeee:23,effect:[39,57,90],effici:[2,4,10,12,43],efficient_text_searching_in_java:10,egg:[19,59,60,81],eight:12,either:[1,5,9,12,18,23,24,27,44,45,46,63,80,83,88,90,92],element:[0,2,3,4,6,13,15,17,18,27,30,31,34,36,37,42,46,47,48,50,51,53,54,58,60,67,71,75,78,80,82,83,84,85,87,102],elit:[18,75,84,85,86,101],ellipsi:36,embed:44,emoji:[2,9,46],emoji_modifi:9,emoji_modifier_bas:9,emoji_present:9,emploi:9,empti:[0,2,3,4,6,9,12,18,27,31,46,47,48,50,51,80,81,82,83,86],emul:2,en_au:6,en_u:[6,57,59,81,92],enabl:[12,30,65,66],enc2utf8:[42,43],enc:[33,39],enclos:[9,23],encod:[0,2,3,9,13,30,32,34,35,36,40,42,43,49,53,62,72,73,88,96,102],encoding_convers:[5,32,40,41,42,43,44],encoding_detect:[5,30,31,34,35,36],encoding_manag:[5,33,37,38,39],encodingnam:44,encount:[5,12,39],encourag:[1,100],end:[0,2,3,7,8,9,12,13,27,30,32,46,57,58,59,62,63,66,67,75,78,82,85,86,87,90,91,97,
101],endian:[1,2],engin:[0,2,3,7,9,11,12,13,18,27,30,46,58,60,75,80,83,88],english:[6,10,30],enhanc:79,entir:66,entireti:72,entri:[0,37,66],enumer:100,envir:85,environ:[1,2,41,85],equal:[17,23,29,30,31,51,52,64,68,71,80,81,99,100],equat:90,equip:2,equival:[2,5,9,10,15,16,17,19,29,38,42,48,51,59,64,65,66,75,76,79,82,88,96,99,100],era:[22,23,26],erron:44,error:[2,4,9,12,33,53,66,84,101],error_on_unknown_escap:66,escap:[0,3,12,13,23,66,75],especi:[1,5,10,30,86],essenti:96,establish:[2,4,57,64,91],eszett:92,etc:[1,2,4,5,12,21,22,26,42,46,63,80],etiam:[84,101],euc:30,euro:[2,6],europ:[89,91],european:[5,6],evalu:12,even:[5,8,12,23,30,54,55],evenli:101,ever:5,everi:[13,60,75,77,101],everyth:9,exact:[2,12],exactli:[5,12,17,32,33,38,42,68],examin:[5,27],exampl:[0,2,5,6,8,9,11,12],examplercppstringi:2,exce:[44,72],except:[2,9,12,23,101],exclud:[63,88],exclus:[86,87],exdent:[2,101],execut:[1,45],exemplar:23,exemplari:23,exercis:69,exist:[1,2,5,12],expand:2,expect:[1,4,6,9,66],experi:[1,101],expert:39,explain:[4,5,6,7],explicit:5,explicitli:[44,86],expon:101,express:[0,3,4,5,7,9,13,66,82,97],extend:[5,9,23,36,38,40,43],extens:2,extern:[2,5],extra:[1,64,93],extract:[0,2,3,7,12,13,29,58,80,81],face:1,facil:[10,11,30,31,66,98],fact:[30,37],factor:4,fail:[1,2,5,6,12,30,31,39,41,43,62,66],failur:[2,12,30,31],fall:[9,23],fallback:1,fallback_encod:[2,72],fals:[2,5,21,23,27,29,30,35,36,37,43,44,46,47,48,49,51,54,58,59,60,63,64,65,67,68,69,74,75,78,80,81,82,83,86,87,88,101],famili:[2,31,37,63],familiar:2,fanci:[13,48],faq:5,fashion:[2,17],fast:[0,2,11,12,13],faster:[9,44,83,88],fastest:50,fcd:64,featur:[0,1,2,12,19,59,68,81,101],feature_test:2,februari:20,fedora:1,feed:[12,82],feel:[14,15,17,83],fetch:[1,89,90],few:[0,1,12,30,31],fewer:12,fff0:9,fffb:9,fffd:44,field:[0,2,3,23,80],file:[0,1,2,3,5,13,30,63,82,84,85],fill:[2,46,47,54,80,81],filter:[30,81],filter_angle_bracket:30,find:[1,4,8,9,50,58,67],first:[1,2,4,7,8,9,10,12,17,22,23,29,31,33,46,48,51,52,58,59,60,75,83,90,92,94,97,101],
fit:[5,8,63],fix:[0,2,3,10,12,18,27,43,46,49,58,62,66,75,80,83,88],flag:[1,2,12,23,49,66],flatten:[0,3],flavor:[1,9],flavour:2,floor:[68,101],fname:[2,72,73,102],fold:[2,13,96],follow:[1,2,5,6,7,9,12,13,19,22,26,29,30,31,33,45,47,49,55,59,63,69,82,84,85,89,92,94,96,98,100,101],font:100,food:60,forc:[1,2,64],form:[5,6,9,12,16,23,24,36,40,42,49,55,57,60,64,75,82,86,96,98],formal:[96,100],format:[0,2,3,8,9,12,13,30,90,96],formatpars:[23,26],formatt:24,found:[29,40,44,46,58],four:5,fox:75,fraction:[21,23],fragment:12,frame:[2,22,30,31,90],free:12,freeli:9,french:[6,30,64],frequent:[2,30],friedl:12,friend:15,friendli:[2,5,33,39,86,87],from:[0,1,2,3,4,5,9,12,13,17,21,23,29,30,37,43,44,46,51,58,66,67,69,71,75,78,80,82,83,87,88,90,94,96],from_last:[2,29],fromlast:[2,29],front:86,full:[2,23,65,80,81,92,94,100],fulli:[0,31,60],fundament:6,further:[5,13],futur:[2,23,63,64,65,66,84,85],gaertner:17,gagolew:[1,2],gagolewski:[0,2,13],gain:2,garbag:2,gather:13,gb18030:30,gcing:2,gcmask:2,gcuacggagcuucggagcuag:93,gener:[0,1,2,3,4,7,8,12,13,18,23,27,32,39,40,42,44,46,53,61,70,83,86,87,92,95,96,97,100],general_categori:9,generic_loc:89,generic_long:89,generic_short:89,german:[6,30,92],get:[0,1,2,3,4,5,6,33,45,51,52,53,55,58,59,64,74,84,94,97,101],getlocal:[5,38,39],getopt:[68,101],ggg:23,gggg:23,ggggg:23,ghi:27,github:[0,1,2,9,13,26,63,64,66,90,91],give:[0,2,5,11,12,13,23,29,37,38,49,57,58,59,60,67,68,70,71,76,77,79,80,81,83,84,85,86,87,93,101],given:[0,2,3,4,5,7,12,17,18,23,24,27,32,33,35,36,37,38,39,46,47,49,52,53,54,58,60,66,67,68,69,75,76,80,81,82,83,86,90,93,94,97,98,101,102],glanc:[9,10],glibc:2,gmt:[23,89,90],gmt_long:89,gmt_short:89,good:[12,46],graphem:[5,12],great:4,greater:[5,17,36,38,40,51,52,62,71,101],greatest:31,greatli:0,greedi:[2,101],greek:[9,30,94],greenwich:90,gregorian:[2,20,21,22,23,26,89],gro:[29,94,99],gross:[29,99],group:[0,2,3,5,6,12,30,46,75],gru:23,grudnia:23,guarante:[1,2],guess:[30,31],guid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94
,95,96,99],guidelin:[23,72,82],had:[2,5],hadlei:0,half:90,halfwidth:94,hand:[80,81],handl:[2,5,6,8,30,38,50,53,62,76,86,94,98],hangul:100,happi:[59,81],hard:63,has:[0,1,2,5,30,38,39,43,48,51,52,53,83,86,91],have:[1,2,5,6,8,9,12,23,29,31,33,39,44,54,63,68,100,101],hbox:2,he_il:26,heap:66,hebrew:[20,21,22,26,30],help:1,hemispher:90,henc:[29,99],here:[9,10,11,12,17,23,30,38,41,43,53,58,60,92],hesit:1,heurist:[30,31],hex:[12,45,94,98],hex_digit:9,hexadecim:9,hhhh:12,hhhhhhhh:12,higher:[30,31],hiragana:63,histor:90,hit:31,hladn:17,hladni:[17,67,78,79],hms:23,hold:[17,38],home:[2,13],homepag:[0,13],honour:2,hopefulli:1,horizont:[12,101],host:0,hour12:22,hour:[20,21,22,23,89,90],how:[2,4,5,6,7,9,10,12,13,17,55,67,78,79],howev:[1,2,5,6,9,14,30,35,36,44,54,55,62,75,94],html:[5,6,9,10,12,13,26,30,63,64,66,82,90,91],http:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,85,90,91,92,94,95,96,99,100],human:[6,89],hundr:[5,30,31],hungarian:30,hyphen:[9,100],i18n:[2,13,31],iana:33,ibm420:30,ibm424:30,ibm:[13,33],icecream:60,iconv:44,icu4c:[0,2,9,13,26,63,64,66,90,91],icu52dt:2,icu55:[1,2],icu61:2,icu:[0,1,2,5,6,7,8,9,10,13,17,19,20,23,24,26,29,30,31,33,37,38,39,44,46,47,49,55,56,59,60,63,64,65,66,67,75,78,79,81,89,90,91,92,94,95,96,98,99,101],icudt52b:2,icudt61b:2,icudt61l:2,icudt:[1,2],icudt_dir:1,id456:88,id_:14,id_continu:9,id_start:9,ident:90,identifi:[0,2,3,9,19,20,21,22,23,26,31,33,37,47,55,56,59,89,91,92,94,95,101],ideograph:[9,63],iec:9,ietf:[13,96],ifels:102,iff:31,ignor:[2,5,6,9,10,11,12,17,19,23,25,30,44,47,51,52,59,64,71,80,86,90,93,96],ignore_nul:[2,51],ill:[32,40,42,98],imag:30,imbal:2,implement:[2,6,10,11,12,44,69,72,83,85,92],impli:36,implicit:[5,9,38],imprecis:[5,30,31],improp:6,improv:2,inc:13,incident:5,includ:[0,1,2,3,6,7,8,9,12,13,18,26,27,46,58,60,62,75,80,83,85,86,88,100],inclus:[9,86],incompat:2,inconsist:24,incorrect:[2,43,44,53],incorrectli:2,increas:78,increment:64,inde:36,indent:[2,101],independ:[2,7,13,15,17,34,35,36,75],index:[2,29,58
,59,83,86,87],indian:26,indic:[2,7,15,17,29,31,34,36,44,46,47,49,58,59,60,81,86,87,99],individu:[2,6,13,42,46,80],influenti:1,info:[12,90],inform:[2,5,6,10,12,13,17,19,33,37,47,49,55,56,57,59,67,78,79,81,89,90,91],initi:[2,5,6,9,31,101],inject:86,input:[2,5,11,12,17,30,32,38,40,44,45,51,59,63,64,66,67,72,75,78,80,82,86,87,92,93,94,96,101],ins:72,insensit:[0,3,5,9,12,17,65,66],insert:2,insid:[12,23,66],insight:55,inspect:27,inspir:[0,12,31],instal:[0,2],instanc:[4,5,18,23,27,36,37,46,58,60,83,86,97],instead:[2,62,68,101],instruct:2,integ:[4,5,17,18,19,20,21,27,28,29,32,42,53,54,58,59,62,64,66,67,68,69,71,80,81,83,84,85,86,87,100,101],intellig:2,intens:2,interact:6,interchang:[90,96],interest:[4,13,27,83,88],interestingli:10,interfer:30,intern:[2,5,13,30,32,39,44,49,62,91],internation:13,internet:1,interoper:[5,96],interpret:[5,23,40,43],intersect:9,intit:78,introduc:[2,96],introduct:[0,12],inttoutf8:32,intuit:[5,38,67],invalid:[2,43],invis:[39,57,91],ipa:0,ipsum:[0,2,3,18,52,75,80,84,85,86,101],is_unknown_8bit:[5,43],isalnum:9,ish:2,islam:[6,26],ismwx:12,iso8601:23,iso:[5,6,9,13,23,30,90],ispunct:9,issu:[1,2,4,13,42,44],italian:30,iter:[2,4,8,9,19,47,59,63,81,92,101],its:[2,4,5,6,9,12,13,15,17,29,37,86,99],itself:[40,90],ja_jp_tradit:26,jamo:100,januari:[20,22],japanes:[8,9,26,30,94],java:[0,10,12,13,33],jdk:12,jkl:27,john:2,join:[14,28,48,51,52],jone:[59,81],joy:13,juli:23,julian:23,jump:75,just:[2,5,6,8,12,19,29,31,41,47,58,59,60,69,75,87,99],kana:63,katakana:[9,63,94],keep:58,kei:[0,2,3,5,64],keyboard:[5,38],keyword:[6,13,20,21,22,23],kile:85,kind:9,know:[4,5,39],knowledg:5,known:[0,2,3,5,31,45,56,66,98],knuth:[2,11,101],koi8:30,korean:[9,30],l10n:13,lacinia:[84,85,101],lai:69,languag:[0,2,3,5,6,7,8,11,13,17,29,31,55,57,64,65,92,94,99,101],language_countri:[6,55,57],language_country_vari:[6,57],lappli:90,larg:9,larger:[2,5],largest:12,last:[2,7,12,29,46,58,59,60,75,82,83,86,93,97,101],latest:1,latex:[0,3],latin1:[2,5,38,44],latin:[9,68,69,71,94,101],lazi:75,lc_cty
pe:[5,38,39],ldflag:[1,2],lead:[4,5,9,12,17],leak:2,leap:[25,90],least:[4,12,27,30,31,68,71,84],leav:[86,87],led:2,ledkov:2,left:[0,3,9,46,58,64,66,75,101],legal:9,legibl:30,length:[0,2,3,4,9,11,12,29,30,31,38,46,47,48,51,52,53,54,58,59,62,67,68,69,71,75,78,79,80,81,86,87,96,100,101],lenient:[21,23],less:[12,17,54,58],let:5,letter:[6,8,9,10,11,14,18,23,24,30,34,36,48,50,51,53,62,63,64,66,70,71,78,90,92,94,100],level:[2,64],lexicograph:[17,67,78],lib64:1,lib:[1,2,49],libc:2,libicu:[1,2],librari:[1,2,17,31,49,97],licens:[0,2,13],ligatur:17,like:[0,1,2,4,5,9,13,14,19,23,31,47,51,58,59,68,75,81,87,92,99,101],limit:[30,66],line:[0,1,2,3,8,9,12,13,19,30,59,63,66,68,73,81,84,85,101],line_break:[8,19,47,59,63,81],linesnempti:84,linguist:[8,9],link:[1,2,9,13],linker:1,linux:[2,5],lipca:23,list:[0,1,2,3,4,5,6,8,9,12,13,16,17,18,19,27,29,30,31,32,33,34,35,36,39,42,44,46,47,49,55,58,59,60,67,75,78,79,80,81,82,83,87,88,89,92,94,99,100,101],liter:[12,23,66,75],littl:1,lll:23,llll:23,lllll:23,load:[2,5,30,84,85],local:[0,2,3,7,8,9,12,13,15,17,19,20,21,22,23,26,29,46,47,49,58,59,63,64,67,78,79,81,89,90,92,99,101],locale_manag:[6,55,56,57],locale_sensit:[6,8,10,15,17,19,29,31,47,59,64,67,78,79,81,92,99,101],localiz:[0,2,3],locat:[0,2,3,7,8,10,11,19,23,44,47,81],locate_first:58,locate_last:58,log:[67,78],logic:[4,15,17,21,23,27,29,30,34,35,36,37,43,44,46,47,48,49,50,51,54,58,59,60,63,64,65,66,67,68,69,75,78,80,81,82,83,86,87,88,96,101],london:89,longer:[2,36,72,93],longest:[51,54],look:[2,12,14,15,17,30,80,83],lookahead:58,lookup:12,loos:12,lorem:[0,2,3,18,52,75,80,84,85,86,101],los_angel:23,lower:[13,64,92,94],lowercas:[9,94],lukaszdaniel:2,lunar:23,lunch:60,machin:[1,5,39],macro:2,made:2,magrittr:[2,86,87],mai:[1,2,4,5,6,7,8,9,11,12,17,19,20,21,22,23,24,30,33,35,38,39,40,42,43,44,53,54,55,56,57,58,59,62,63,66,68,70,71,75,76,77,80,81,83,84,85,86,92,95,96,97,101],main:30,mainli:94,major:5,make:[1,2,5,8,83,96],makeconf:1,makevar:2,malform:[2,9,55],malici:2,man:[4,7,9,13,45],manag:[1,2
,13],mandatori:63,mani:[0,2,6,7,9,12,13,55,57,91,96,97,101],manipul:[5,13],manual:[0,1,2,4,5,12,13,24],map:[0,2,3,5,6,13,40,43,55,65],marek:[0,13],margin:8,mario:17,mark:[2,5,8,9,12,27,30,32,34,35,36,38,40,41,43,44,62,72,86,96],marker:[23,44,72],markov:69,markup:30,mask:98,master:[1,12],match:[0,2,3,6,7,8,9,10,12,13,30,31,38,39,46,47,58,59,65,66,75,82,97],matcher:[0,3,4],math:9,mathemat:[9,94],matric:[2,58,59,60,86,87],matrix:[0,3,46,47,58,59,60,80,81,86],max:33,max_count:[2,27],maxim:[33,44,66,72,80,81,101],maximum:1,mean:[9,23,35,36,57,66,84,90,91],meaning:5,mechan:[5,38],medial:100,medium:23,memcheck:2,memori:[2,5,62,73],mention:[19,59,64,81],mere:46,merg:[2,30,46,58,75],messag:[2,12],met:1,meta:83,metacharact:66,method:[53,91,101],mgk25:100,microsystem:2,middl:[8,9,86],might:[9,11,17,19,23,27,30,37,44,86,90],migrat:[9,65],mileston:2,millisecond:[20,22,23,66],mime:33,mimic:2,min:33,mind:[5,58],minim:[2,33,54,68,101],minu:5,minut:[20,21,22,23],mirror:[1,2],misalign:2,mislead:[5,53],miss:[0,2,3,27,29,38,40,42,43,44,46,47,48,50,51,53,58,59,60,61,62,64,66,67,74,78,80,84,86,87,88],mmm:23,mmmm:23,mmmmm:23,mode:[46,58,60,66,72,73,75,101,102],model:[69,96],modifi:[6,9,20,23,57,85,88],mondai:23,mono:100,monster:92,month:[20,21,22,23,26],more:[0,1,2,4,5,6,8,9,10,12,13,17,18,19,23,24,27,30,31,33,37,43,44,46,47,48,56,57,58,59,60,64,67,72,75,78,79,80,81,83,88,89,91,92,96,97,101],moreov:[0,1,2,5,9,19,24,27,38,51,53,54,58,75,82,98,101],morri:[2,11],most:[0,1,2,4,5,9,23,24,26,30,35,36,64,66,96,97,101],mostli:30,move:[2,64],much:[2,10,17,29,72,94,99],multi:[5,9,30],multi_lin:66,multilin:66,multipl:[0,2,3,23,68,86,101],multitud:0,must:[6,8,12,75,87],mutual:[86,87],n_max:2,n_min:[2,54,80,81],n_paragraph:[2,69],na_character_:[2,32,54,60,90],na_empti:[2,48,74],na_integer_:90,na_last:[2,67,78],name:[1,2,4,5,9,12,17,18,19,20,21,22,23,26,27,29,30,31,33,37,39,44,46,47,55,57,58,59,60,63,64,65,66,67,72,73,75,78,79,80,81,83,84,85,88,89,90,92,94,99,102],narrow:26,nativ:[0,2,3,5,9,13,38,39,43
,44,49,62,96],natur:[2,5,7,11,13,17,29,64,99,101],nchar:[2,100],necessari:[1,4,15,18,27,46,58,60,71,75,80,83,88],necessarili:6,need:[2,4,5,12,30,62,86,87,90,97],neg:[12,27,29,80,81,83,86,101],negat:[2,9,27,83,88],neither:[39,43],nel:82,network:96,never:[80,82],new_substr:86,newer:1,newlin:[12,72,82,102],next:82,nfc:[86,96,100],nfd:[64,94,96],nfkc:96,nfkc_casefold:96,nfkd:[94,96],nibh:[84,85,101],nice:2,nie:94,nil:2,nisan:21,nix:2,non:[2,4,5,9,10,12,17,19,20,21,22,23,27,29,45,47,59,64,67,70,71,77,78,81,84,86,98,99,101],noncharacter_code_point:9,nondecreas:[67,78],none:[2,84,101],nonincreas:[67,78],nor:[39,43],norm:96,normal:[0,2,3,5,9,13,17,37,53,62,64,69,70,71,77,86,94,97,99,100,101],normalis:[0,2,64,101],northern:90,norwegian:30,note:[1,2,5,8,9,10,11,12,13,14,17,18,19,20,22,23,30,32,35,36,39,40,41,43,44,46,47,51,53,56,57,58,59,60,63,66,68,75,77,80,81,83,86,90,92,94,96,97,98,100,101],noteworthi:102,noth:[23,102],notion:[10,17,100],now:[1,2],nparagraph:[2,69],npattern:75,nth:12,nul:[44,62],number100:64,number2:64,number:[0,1,2,3,5,6,7,9,12,13,20,22,23,25,27,28,31,33,46,54,63,68,69,71,75,80,81,84,85,92,93,100,101],numer:[2,4,5,9,21,23,30,31,64,67,78,90,101],numeric_valu:9,object:[0,2,3,14,15,17,19,20,22,23,25,32,38,42,46,47,50,51,53,59,62,63,64,65,66,72,73,76,80,81,86,88,100,102],observ:[2,5,6,43,71,90],obtain:[0,2,5,9,30,31,55,84,85,90],occur:[7,8,12,30,44],occurr:[0,2,3,7,18,27,31,44],octal:[12,98],off:1,offset:[89,90],often:[0,10,30,35,62,69,94,96,97],ogonek:[5,36,77,96],old:39,older:1,oldloc:57,oldrel:2,oldtz:91,omit:[1,48,63,82],omit_empti:[2,48,80,82],omit_na:[2,86,87,88],omit_no_match:[2,46,47,52,58,59,60,87],onc:[4,27,73],one:[1,2,4,5,6,8,9,12,18,20,23,26,27,32,33,38,42,44,46,48,53,54,55,58,59,60,62,63,64,68,71,75,84,87,88,89,90,92,94,96,102],ones:[33,64,98],onli:[2,4,5,9,12,30,33,38,39,46,48,51,52,58,59,60,63,66,68,75,79,80,81,82,86,87,88,90,92,97,101],ooo:[12,98],oooo:23,open:[0,2,9,72,73,102],opensus:[1,2],oper:[0,1,2,3,4,5,7,8,9,13,14,15,17,21,29,30,32,42,
57,62,66,68,70,71,77,86,87,91,94,99,101],operator_add:[0,3],operator_compar:[0,3],operator_dollar:[0,3],opposit:64,optim:5,option:[1,2,6,15,17,29,30,43,51,52,67,78,79,99],opts_brkit:[2,19,47,59,81,92],opts_col:[2,17,18,27,29,46,58,64,67,75,78,79,80,83,88,99],opts_fix:[2,18,27,46,58,65,75,80,83,88],opts_regex:[2,18,27,46,58,60,66,75,80,88],oracl:2,order:[0,2,3,5,6,9,13,17,27,30,31,43,44,64,70,72,77,78,79,86,96],ordinari:[51,64],org:[1,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,90,91,92,94,95,96,97,99,100],orient:85,origin:[2,79,85],other:[0,2,4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],otherwis:[4,23,27,29,44,45,46,47,49,51,52,54,66,71,80,81,84,89,90,101],our:[1,2,4,5,97],out:[1,2,5,9,46,50,68,69,86,97],output:[2,5,23,42,43,44,47,53,67,68,70,71,72,73,77,78,88,96,102],outsid:[12,23],over:[2,5,14,15,16,17,18,19,20,21,22,23,27,28,30,31,46,47,51,58,59,60,68,71,75,80,81,82,83,86,87,88,92,93,97,101],overal:12,overflow:2,overful:2,overlap:[2,9,46,58,60,65,75],overload:16,overrid:1,overwhelm:1,own:44,pace:13,pacif:23,packag:[1,2,5,9,47,57,68,91],pad:[0,2,3,13],page:[2,4,5,7,13,24,45],pair:9,pairwis:15,paper:[0,2,10],paragraph:[0,2,3,8,9,69,82],paramet:[2,10,82,86,87],parametr:6,parenthes:[12,60,75],pars:[0,2,3,13],part:[1,2,9,38,39,75,86,87],particular:[1,4,5,6,8,9,13,63,86,94],pass:[0,1,2,3,16,18,27,46,55,58,59,60,63,64,65,66,75,80,83,86,87,88],password:71,past:[2,48,51,76],pat1:9,pat2:9,pat:[58,83],patch:2,path:1,patter:2,pattern:[0,2,3,4,7,10,12,13,23,30,66,71,93,97],pdf:2,pdt:23,peculiar:[4,70,71,77],pellentesqu:[84,101],per:[4,6,57,69,101],perform:[0,2,3,4,5,6,7,9,10,11,12,15,17,19,29,47,56,57,59,62,63,64,66,67,73,78,81,94],perhap:[67,78],perl:[9,12],permiss:64,permut:[0,2,3,70,77],persian:26,phonebook:[6,17],php:
85,piec:[9,10,19,80,81],pipabl:2,pipe:[2,86,87],pizza:60,pkg:[1,2],pkg_config:[1,2],pkg_config_path:1,pl_fonipa:94,pl_pl:[17,23,26,55,67,78,79],place:[9,86,87,88],plai:[5,87],plain:76,plass:101,platform:[1,2,5,6,13,38,82,91,102],pleas:[1,4,5,9,10,17,24,44,60,63,97],plu:[5,9,12],point:[0,2,3,5,8,9,12,13,15,17,19,31,32,33,40,42,44,59,62,64,65,68,71,77,83,84,86,90,92,93,99,101],polish:[5,6,17,30],poor:2,poorli:66,portabl:[0,1,2,5,9,44],portion:12,portugues:30,posit:[2,5,8,9,12,35,36,58,59,63,64,80,81,83,86,101],posix:[2,65],posix_alnum:9,posix_blank:9,posix_graph:9,posix_print:9,posix_xdigit:9,posixct:[20,21,22,23,25],posixst:23,possess:12,possibl:[0,1,2,3,4,5,12,31,38,63,65,80,81,83,96,101],potenti:96,power:[0,12,13],pqrst:28,practic:101,pratt:[2,11],pre:[2,94],preced:[9,12],precis:[5,6,66,90],predefin:[9,69],predict:13,prefer:12,prefix:[2,101],prepar:2,preprocessor:1,preserv:[2,97,101],prevent:[2,63],previou:[12,57,91],previous:[2,39,57,91],primari:64,print:[2,5,8,9,20,53,68,86,87,88,100,101],printabl:45,prioriti:86,privat:9,probabl:71,problem:[1,2,96],problemat:44,proce:100,process:[2,3,5,7,8,9,10,11,17,29,30,45,47,62,66,68,69,80,91,94,96,97,99,101],produc:[23,44,65],prof:[59,81],program:[5,6,101],proin:[85,101],project:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94,95,96,97,99],pronounc:0,propag:1,proper:36,properli:[1,5,6,10,38,50,53,62],properti:[4,7,12,18,84,97,100],protect:2,protocol:5,provid:[2,5,6,9,10,11,12,13,16,17,31,33,47,49,51,55,60,64,86,89,90,93,94,101],pseudo:[2,13,69,70,71],pt_br:57,punct:9,punctuat:[8,9,10,11,23],purpos:[2,5,8,82],put:[67,78,96,101],python:16,qqq:23,qqqq:23,qqqqq:23,quarter:[23,26],quaternari:64,queri:[0,3,6,56,91],quick:75,quicker:75,quit:[0,5,12,66],quot:[9,12,23,45],quotat:9,quotation_mark:9,r_home:1,r_inst_dir:1,r_usedynamicsymbol:2,ragged:[2,101],rais:[2,33],random:[0,2,3,9,13,69,70,77],randomli:[0,3,69],rang:[0,5,9,12,23,86,87,94],ranki:94,rare:[2,4,5],rather:[27,44,66,68,83,88,96,101],raw:[0,3,5,30,3
1,34,35,36,42,44,89,90],rawoffset:89,rawtochar:[30,44],rbbi:63,rbind:90,rbuildignor:1,rchk:2,rcpp:[0,2],read:[0,2,3,5,13,38,41],readabl:89,readbin:30,readlin:[30,72,84,85],real:23,realli:[5,55],rearrang:67,reason:[2,4,5,43,44],recal:9,recent:1,recogn:[6,45,66,98],recommend:[96,101],recycl:[2,4,15,18,27,46,58,60,71,75,80,83,87,88],redund:71,refer:[0,1,2,18,24,27,46,58,60,75,80,83,88],referenc:6,reflect:[6,33],reformat:101,regard:29,regardless:5,regex:[0,2,3,4,7,9,18,27,46,58,75,80,83,88],regexmatch:2,regexp:[9,12,66],region:[6,90],regular:[0,3,4,5,7,9,13,66,82,97],reilli:12,rel:[1,23],relat:[13,15,17,23],relationship:64,releas:[0,1,2,84,85],relev:1,reli:[1,2,5,83,97],reliabl:64,remaind:[80,81],rememb:4,remov:[0,2,3,5,9,17,30,37,43,63,64,65,66,67,75,78,80,82,94,96,97,99],renam:2,rep:70,replac:[0,2,3,7,13,20,23,24,40,43,44,71,80,88,93,97,101],repo:1,report:[1,2,9,12,19,66,82,96,100],repres:[5,9,17,23,25,30,32,33,36,37,46,58,60,66,82,84,85,90],represent:[2,5,21,33,79,89,91],request:[5,6,24,56],requir:[1,2,11,12,23,63],reserv:[9,23],resolv:1,resourc:[6,56],respect:[2,4,9,12,18,23,27,46,47,58,59,75,80,81,83,86,87,88,93],rest:92,restor:[57,91],restrict:94,result:[2,4,5,6,9,11,12,13,14,15,17,18,19,23,27,28,29,35,36,37,41,43,46,47,49,51,52,54,55,58,60,64,65,69,70,71,75,77,78,79,80,81,82,83,87,88,92,98],retri:12,reus:4,revers:[0,3,13,33,68,70],revert:2,rexamin:75,rf_error:2,rfc3629:13,rfc5198:96,rfc:[13,23,96],rid:[2,74],right:[0,3,9,46,58,75],robust:72,role:[5,87],romanian:30,roughli:[31,42,76,88,100],round:[2,60,75],routin:[2,5],row:[23,46,47,54,58,59,60,80,81],rpm:1,rule:[2,4,19,47,59,63,64,82,87,90,96],run:[2,30,46,57,62,75,83,86,91],russian:30,sake:23,same:[2,5,6,9,13,17,29,33,38,39,50,53,54,55,57,62,64,79,80,90,96,99,100],sampl:[71,78],saniti:2,sappli:[69,89],sausag:52,save:[89,90],scelerisqu:[84,85,101],scenario:[46,58,60,87],scharf:92,schedul:2,scheme:[5,9,33],scp:1,screen:68,script:[1,2,9,68,71,94,101],search:[0,1,2,3,4,5,6,9,11,12,13,18,19,27,29,46,47,58,59,60,63,64
,66,71,75,80,81,83,84,88,97,100],search_charclass:[7,9,97],search_col:[7,10,64],search_count:[7,18,19],search_detect:[7,27,83],search_extract:[7,46,47,60],search_fix:[7,11,65],search_loc:[7,58,59],search_regex:[7,12,66],search_replac:[7,75,97],search_split:[7,80,81,82],search_subset:[7,88],second:[2,17,20,21,22,23,25,58,59,60,90],secondari:64,section:[6,9,12,66],sed:[1,84,85,101],see:[0,1,2,16,68,77],seek:13,seem:10,seen:[2,38],segfault:2,select:[0,3,5,6,22,31,33,69,101],selector:26,semant:5,sens:5,sensit:[0,3,7,13,23,57,65,66,92],sentenc:[8,19,59,63,69,81,92],sep:[2,14,23,48,51,52,68,69,76,101,102],separ:[8,9,23,47,48,51,52,55,58,63,72,80,82,83,84,85,94,102],septemb:23,sequenc:[0,1,2,3,5,11,12,23,30,32,34,36,40,42,43,44,53,58,66,82,94,96,101],seri:[9,94],serv:[44,82],server:[1,2],servic:[2,5,6,10,56,64,90,94],session:1,set:[0,1,2,3,4,5,6,9,11,12,17,18,19,20,21,22,23,27,29,32,42,43,44,46,47,51,53,58,59,60,67,69,71,75,78,79,80,81,82,83,88,92,99],setdatadirectori:2,setup:1,sever:[6,30],shall:2,shape:9,shift_ji:30,ship:[1,2],shorter:[15,18,27,46,58,60,75,80,83,88],should:[1,2,5,6,21,23,29,30,38,39,44,48,49,54,58,63,65,67,68,69,74,75,78,80,82,88,97,100,101],show:30,shown:[5,9,12],shuffl:[0,3],side:[0,3,68,101],sign:[2,5,9,20,25],signific:[2,6,23],significantli:[29,99],silent:[2,4,5,17,43,51,52,86],similar:[2,5,6,9,12,16,43,54,55,90],simpl:[2,5,38,65,69,101],simplest:87,simpli:[1,2],simplifi:[2,30,37,46,47,69,80,81,101],simplify2arrai:54,sinc:[0,9,12,25,46,75,90],singl:[2,5,8,9,16,19,20,21,22,23,26,27,29,30,31,32,33,37,39,40,43,44,46,47,48,49,51,52,54,55,57,58,59,60,63,64,65,67,68,69,71,72,75,76,78,80,81,82,83,86,87,88,89,90,91,92,93,94,97,101],singleton:27,sit:[18,52,69,75,80,84,85,86,101],site:[1,2,13,90],situat:39,six:12,size:[33,44,66,72],sk_sk:[17,46,58,67,78,79,89],skip:[46,58,75],skip_:63,skip_line_hard:63,skip_line_soft:63,skip_sentence_sep:[63,81],skip_sentence_term:63,skip_word_ideo:63,skip_word_kana:63,skip_word_lett:[63,81],skip_word_non:[19,59,63,81],skip_wo
rd_numb:[63,81],slash:9,slightli:[83,85],slovak:17,slow:75,slower:[10,14,29,99],small:[5,71,85,92,94],smaller:87,smith:[59,81],snprintf:2,soft:[9,63,100],soft_dot:9,softwar:101,solari:[1,2,39],sole:[2,5],solut:1,solv:2,some:[1,2,4,5,9,11,12,13,23,24,30,33,37,44,48,55,56,57,58,63,66,85,86,89,98],somehow:5,someth:[9,75],sometim:[4,35,53,82],somewhat:12,sort:[0,2,3,5,6,13,37,64,67,87],sourc:[0,1,2,69],sourceforg:85,southern:90,space:[2,5,8,9,12,18,23,46,58,66,75,84,85,97,100,101],space_separ:12,spaghetti:60,spam:[19,52,59,81],sparc:1,speak:5,special:[5,9,45,63,66],specif:[2,6,8,9,10,11,13,17,20,23,31,56,83,90,96],specifi:[2,5,6,9,12,20,21,22,23,24,37,44,63,71,75,94,96,97,101],spectrum:5,speed:[2,5,66],spell:2,split:[0,2,3,7,12,13,72,73,101],spontan:2,sprintf:[0,2,3],squar:[9,101],src:[1,2],sse2:2,sss:23,ssss:23,ssz:23,stabl:[67,78],stable_sort:[67,78],stack:[2,66],stack_limit:[2,66],stage:2,stand:[6,9,22,23,26],standalon:26,standard:[0,1,2,5,6,9,12,33,59,62,81,82,96,98,100],start:[0,2,3,7,8,9,27,46,58,59,66,68,69,75,86,87,97,101],start_lipsum:69,stat:[84,85],state:[2,9,20,68,89,101],statist:[0,3,5,13,30,31],statu:[2,19,47,59],stdin:[5,38],step:94,stick:97,still:[1,6],sting:27,stl:[67,78],stop:[2,27,66],storag:[5,66],store:[5,62],str2:76,str:[2,11,18,19,23,27,28,29,30,31,34,35,36,38,40,41,42,43,44,45,46,47,48,50,53,58,59,60,62,67,68,70,75,76,77,78,79,80,81,82,83,84,85,86,87,88,92,93,94,96,97,98,99,100,101,102],str_split_fix:2,strchr:2,strcmp:17,stream:[0,3,40,43],strength:[17,29,46,58,64,83,99],strftime:[23,24],stri:[2,14,15,16,28],stri_:[2,4,7,9,10,12,65,83],stri_brkit:2,stri_c:[2,51],stri_c_list:52,stri_cmp:[2,13,17,64],stri_cmp_eq:[2,17,92],stri_cmp_equiv:[2,15,17],stri_cmp_g:[2,17],stri_cmp_gt:[2,17],stri_cmp_l:[2,15,17],stri_cmp_lt:[2,17],stri_cmp_neq:[2,17],stri_cmp_nequiv:[2,17],stri_col:64,stri_compar:[0,3,6,8,10,15,19,29,31,47,59,64,67,78,79,81,92,99,101],stri_conv:44,stri_count:[0,2,3,7,19],stri_count_:7,stri_count_boundari:[0,2,3,6,7,8,10,13,15,17,18,29,31,47
,53,59,63,64,67,78,79,81,82,92,99,101],stri_count_charclass:18,stri_count_col:18,stri_count_fix:[2,18,65],stri_count_regex:[18,66],stri_count_word:[2,19,47,59],stri_datetime_add:[0,2,3,21,22,23,24,25,26,89,90,91],stri_datetime_cr:[0,2,3,20,22,23,24,25,26,89,90,91],stri_datetime_field:[0,2,3,20,21,23,24,25,26,89,90,91],stri_datetime_format:[0,2,3,13,20,21,22,24,25,26,89,90,91],stri_datetime_fstr:[0,2,3,20,21,22,23,25,26,89,90,91],stri_datetime_now:[0,2,3,20,21,22,23,24,26,89,90,91],stri_datetime_pars:[2,23,24],stri_datetime_symbol:[0,2,3,20,21,22,23,24,25,89,90,91],stri_detect:[0,2,3,7,83,88],stri_detect_:[2,7],stri_detect_charclass:27,stri_detect_col:[27,64],stri_detect_fix:[27,65],stri_detect_regex:[2,27,66,83],stri_dup:[0,2,3,13,14,48,51,52],stri_dupl:[0,2,3,6,8,10,13,15,17,19,31,47,59,64,67,78,79,81,92,99,101],stri_duplicated_ani:[2,29],stri_enc_detect2:[0,2,3,5,6,8,10,15,17,19,29,30,34,35,36,47,59,64,67,78,79,81,92,99,101],stri_enc_detect:[0,2,3,5,31,34,35,36,73],stri_enc_fromutf32:[0,3,5,40,41,42,43,44,46,100],stri_enc_get:[5,38,39,41,43,44],stri_enc_info:[0,3,5,37,38,39,49],stri_enc_isascii:[0,2,3,5,30,31,35,36],stri_enc_isnf:2,stri_enc_isutf16:[0,3],stri_enc_isutf16b:[5,30,31,34,35,36],stri_enc_isutf16l:35,stri_enc_isutf32b:35,stri_enc_isutf32l:35,stri_enc_isutf8:[0,2,3,5,30,31,34,35],stri_enc_list:[0,3,5,33,38,39,44],stri_enc_mark:[0,2,3,5,33,37,39,40,41,43,44],stri_enc_nf:2,stri_enc_set:[0,2,3,5,33,37,38],stri_enc_toascii:[0,3,5,32,41,42,43,44],stri_enc_ton:[0,2,3,5,32,40,42,43,44],stri_enc_toutf32:[0,3,5,32,40,41,43,44],stri_enc_toutf8:[0,2,3,5,32,40,41,42,44,53,76],stri_encod:[0,2,3,5,30,32,40,41,42,43,72,73],stri_endswith:[2,27,83],stri_endswith_:[2,7],stri_endswith_charclass:83,stri_endswith_col:83,stri_endswith_fix:83,stri_escape_unicod:[0,3,13,62,98],stri_extract:[0,2,3,7,58,60],stri_extract_:[2,7,46,47],stri_extract_al:[2,7,46,47,54,60,87],stri_extract_all_:[2,46,47],stri_extract_all_boundari:[6,7,8,10,15,17,19,29,31,46,47,59,60,63,64,67,78,79,81,82,
92,99,101],stri_extract_all_charclass:[2,46],stri_extract_all_col:46,stri_extract_all_fix:[2,46,65],stri_extract_all_regex:[2,46,52,60],stri_extract_all_word:[2,8,12,19,47,52,59],stri_extract_boundari:[0,3],stri_extract_first:[46,86],stri_extract_first_:[46,47],stri_extract_first_boundari:47,stri_extract_first_charclass:46,stri_extract_first_col:46,stri_extract_first_fix:46,stri_extract_first_regex:46,stri_extract_first_word:[2,47],stri_extract_last:[46,86],stri_extract_last_:[46,47],stri_extract_last_boundari:47,stri_extract_last_charclass:46,stri_extract_last_col:46,stri_extract_last_fix:46,stri_extract_last_regex:46,stri_extract_last_word:[2,47],stri_extract_word:2,stri_flatten:[0,2,3,13,14,28,30,51,52,69],stri_info:[0,2,3,39],stri_install_check:2,stri_install_icudt:2,stri_isempti:[0,3,53,62,100],stri_join:[0,2,3,4,13,14,28,48,52],stri_join_list:[0,2,3,14,28,48,51],stri_length:[0,2,3,13,19,50,62,93,100],stri_list2matrix:[0,2,3,46,47,61,74,76,80,81],stri_loc:[0,2,3,7],stri_locale_get:57,stri_locale_info:[0,3,6,49,56,57],stri_locale_list:[0,3,6,55,57],stri_locale_set:[0,3,6,55,56],stri_locate_:[7,58,59],stri_locate_al:[7,58,59,86,87],stri_locate_all_:[2,58,59],stri_locate_all_boundari:[2,6,7,8,10,15,17,19,29,31,47,58,59,63,64,67,78,79,81,82,86,87,92,99,101],stri_locate_all_charclass:[2,58],stri_locate_all_col:58,stri_locate_all_fix:[2,58,65],stri_locate_all_regex:[44,58,87],stri_locate_all_word:[2,19,59],stri_locate_boundari:[0,2,3],stri_locate_first:[58,86,87],stri_locate_first_:[58,59],stri_locate_first_boundari:[2,59],stri_locate_first_charclass:58,stri_locate_first_col:58,stri_locate_first_fix:58,stri_locate_first_regex:[58,86],stri_locate_first_word:[2,59],stri_locate_last:[58,86,87],stri_locate_last_:[58,59],stri_locate_last_boundari:[2,59],stri_locate_last_charclass:58,stri_locate_last_col:58,stri_locate_last_fix:58,stri_locate_last_regex:[58,86],stri_locate_last_word:[2,59],stri_locate_regex:2,stri_locate_word:2,stri_match:[0,2,3,7,12,46],stri_match_:[2,60]
,stri_match_al:[7,46,47,60],stri_match_all_:[2,60],stri_match_all_regex:60,stri_match_first:60,stri_match_first_regex:60,stri_match_last:60,stri_match_last_regex:60,stri_na2empti:[0,2,3,54,74,76],stri_numbyt:[0,3,19,50,53,100],stri_omit_empti:[2,74],stri_omit_empty_na:[2,74],stri_omit_na:[2,74],stri_opts_brkit:[0,2,3,7,8,19,47,59,81,82,92,101],stri_opts_col:[0,2,3,6,7,8,10,13,15,17,18,19,27,29,31,46,47,58,59,67,75,78,79,80,81,83,88,92,99,101],stri_opts_fix:[0,2,3,7,11,18,27,46,58,75,80,83,88],stri_opts_regex:[0,2,3,7,12,18,27,46,58,60,75,80,88],stri_ord:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,78,79,81,92,99,101],stri_pad:[0,2,3,13,101],stri_pad_:[2,68],stri_pad_both:[2,68],stri_pad_left:[2,68],stri_pad_right:[2,68],stri_past:[2,51,58,70,71,76,83,101],stri_paste_list:52,stri_prepare_arg_posixct:2,stri_rand_lipsum:[0,2,3,13,70,71],stri_rand_shuffl:[0,2,3,13,69,71,77],stri_rand_str:[0,2,3,9,13,69,70],stri_read_bin:2,stri_read_lin:[0,2,3,13,73,84,102],stri_read_raw:[0,2,3,13,72,102],stri_remove_empti:[0,2,3,54,61,76],stri_remove_empty_na:[2,74],stri_remove_na:[2,74],stri_replac:[0,3,7,97],stri_replace_:[7,75],stri_replace_al:[2,7,75,97],stri_replace_all_:[2,75],stri_replace_all_charclass:[2,75],stri_replace_all_col:75,stri_replace_all_fix:[2,75],stri_replace_all_regex:75,stri_replace_first:[75,86],stri_replace_first_charclass:75,stri_replace_first_col:75,stri_replace_first_fix:75,stri_replace_first_regex:75,stri_replace_last:[75,86],stri_replace_last_charclass:75,stri_replace_last_col:75,stri_replace_last_fix:75,stri_replace_last_regex:75,stri_replace_na:[0,2,3,54,61,74],stri_revers:[0,3,13,70],stri_sort:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,79,81,92,99,101],stri_sort_kei:[0,2,3,6,8,10,15,17,19,29,31,47,59,64,67,78,81,92,99,101],stri_split:[0,2,3,7,54,81,82],stri_split_:[2,7],stri_split_boundari:[0,2,3,6,7,8,10,15,17,19,29,31,47,59,63,64,67,78,79,80,82,92,99,101],stri_split_charclass:[2,80],stri_split_col:[2,80],stri_split_fix:[2,55,80],stri_split_lin:[0,3,7,8,13
,19,47,59,63,80,81,92,101],stri_split_lines1:[72,73,82],stri_split_regex:[2,80],stri_startsendswith:[0,3],stri_startswith:[2,7,27,83],stri_startswith_:[2,7],stri_startswith_charclass:83,stri_startswith_col:83,stri_startswith_fix:83,stri_stats_gener:[0,3,13,85],stri_stats_latex:[0,3,13,84],stri_sub:[0,2,3,13,58,59,87],stri_sub_al:[0,2,3,58,59,86],stri_sub_all_replac:87,stri_sub_replac:[2,86],stri_sub_replace_al:[2,87],stri_subset:[0,2,3,7,27],stri_subset_:[2,7],stri_subset_charclass:88,stri_subset_col:88,stri_subset_fix:88,stri_subset_regex:88,stri_timezone_get:[2,20,21,22,23,24,25,26,89,90,91],stri_timezone_info:[0,2,3,20,21,22,23,24,25,26,90,91],stri_timezone_list:[0,2,3,20,21,22,23,24,25,26,89,91],stri_timezone_set:[0,2,3],stri_trans_casefold:2,stri_trans_casemap:[0,3],stri_trans_char:[0,2,3,13,92,94,95,96],stri_trans_gener:[0,2,3,13,92,93,95,96],stri_trans_isnf:[2,96],stri_trans_isnfc:96,stri_trans_isnfd:96,stri_trans_isnfkc:96,stri_trans_isnfkc_casefold:96,stri_trans_isnfkd:96,stri_trans_list:[0,2,3,92,93,94,96],stri_trans_nf:[0,2,3],stri_trans_nfc:[5,13,53,86,92,93,94,95,96,100,101],stri_trans_nfd:[77,94,96],stri_trans_nfkc:96,stri_trans_nfkc_casefold:96,stri_trans_nfkd:[17,19,29,53,68,96,99,100],stri_trans_to:2,stri_trans_tolow:[6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,78,79,81,82,92,93,94,95,96,99,101],stri_trans_totitl:[2,8,92],stri_trans_toupp:[92,94],stri_trim:[0,3,7,13,75],stri_trim_both:[7,9,75,97],stri_trim_left:[68,97],stri_trim_right:97,stri_unescape_unicod:[0,3,45],stri_uniqu:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,78,79,81,92,101],stri_width:[0,2,3,13,50,53,62,68,101],stri_wrap:[0,2,3,6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,68,69,78,79,81,82,92,99],stri_write_lin:[0,2,3,13,72,73],stricontainerutf16:2,stricontainerutf8:2,strictest:64,striexcept:2,string8:2,string:[2,3,4,5,6,9,11,12,16,18,19,20,21,22,23,26,27,29,30,31,32,33,34,35,36,39,40,45,46,47,49,51,53,54,55,57,58,59,60,62,63,64,65,66,67,69,72,75,76,78,79,84,85,86,87,88,89,90,91,93,94,96,99
,100,101],stringi:[7,13,17,18,19,25,27,32,34,35,36,37,38,44,46,47,51,55,56,58,59,60,63,64,65,66,67,68,71,75,78,79,80,81,82,83,84,85,86,88,92,94,96,97,99,100,101],stringi_1:1,stringi_cflag:[1,2],stringi_cppflag:[1,2],stringi_cxxflag:[1,2],stringi_disable_cxx11:[1,2],stringi_disable_icu_bundl:[1,2],stringi_disable_pkg_config:[1,2],stringi_general_top:[4,5,6,7,8,9,10,11,12,13],stringi_ldflag:[1,2],stringi_lib:[1,2],stringr:[0,2],stringsearch:[7,10],strncpy:2,strongli:[1,9],strptime:[0,2,3],strrringi:[18,27],strstr:2,strsxp:2,strwrap:[2,101],stubdata:2,student:2,studio:2,stuff:[84,85],style:[0,3,9,23,30],sub:[12,60,88],sub_index:2,submiss:2,subsequ:101,subset:[1,2,4,5,7,9,27,33],substitut:[2,5,40,44,72,80,86,87,88,101,102],substr:[0,2,3,12,13,46,59,60,64,75,80],success:1,successfulli:1,suffici:2,suggest:[0,1,2,6,101,102],suit:[29,97,99],suitabl:[1,2,101],summar:[9,12],sun:2,sundai:22,superset:[5,39],supplementari:[18,27,46,58,60,75,80,83,88],suppli:[2,12,30,31,75],support:[0,2,5,6,9,23,24,37,39,44,46,49,60,62,80,89,96],suppos:2,suppress:2,sure:[1,35],surrog:9,surround:92,suscipit:[84,85,101],swedish:30,sxpinfo:2,syllabl:9,symbol:[2,9,23],synonym:28,syntax:[9,12,16,23,63],sys:2,system:[1,2,5,6,8,9,38,39,49],tab:[9,12,82,101],tabl:30,tabul:12,take:[10,17,65,68,89,101],taken:[8,30],tar:1,target:[2,44],tartanu:[0,13],task:[2,7,12,13,94,95],tato:94,team:85,technic:[5,8,12,44,82,96],techniqu:30,technolog:2,tellu:[84,101],temporari:14,term:[51,90],termin:[12,27,63,66],terminal_punctu:9,tertiari:64,test1:76,test2:19,test:[2,6,9,15,17,19,27,29,30,39,59,76,81,83,99],text:[0,2,3,5,7,9,12,13,23,30,31,63,68,69,80,84,85,86,92,96,100],text_boundari:[7,8,19,47,59,63,81,82,92,101],textbf:85,textit:85,textual:9,tf08:5,tgca:93,th_th_tradit:26,than:[2,4,5,8,9,10,12,14,17,23,29,38,40,44,51,52,54,58,62,64,70,71,87,99,101],thank:[0,2],thei:[2,5,6,9,12,13,15,17,23,32,43,44,46,58,59,60,63,65,67,75,78,83,88,94],them:[5,6,17,30,33,95],themselv:[66,80],theoret:9,therefor:[5,9,17,82],therein:13,the
reof:44,thi:[0,1,2,4,5,6,7,8,9,17,18,19,22,23,27,30,31,32,33,34,36,37,38,40,41,42,43,44,46,50,51,53,54,55,58,59,60,61,62,63,64,65,66,67,68,70,71,72,75,76,77,78,79,81,82,83,84,85,90,94,96,99,101,102],think:8,third:[8,60,64],those:[5,6,10],though:[2,12],thought:5,three:[12,23,30,31,90,92],through:9,throughout:90,thu:[4,5,59,80,96,102],tie:9,time:[0,2,3,5,9,11,12,13,14,24,28,29,66,80,88,93],time_limit:[2,66],timezon:[20,23,89,90,91],titl:[13,92,94],to_raw:44,todo:2,togeth:[0,1,3,6,49,94],token:[80,81],tokens_onli:[2,80,81],toler:1,too:2,took:4,tool:[2,12,13,96],top:64,topic:[12,13],total:[12,31,68,84,97,101],tr11:100,tr13:82,tr15:96,tr18:[12,82],tr29:66,tr44:9,tr_tr:92,tracker:0,tradit:[30,66],trail:62,transform:[0,2,3,13,93,96],transit:12,translat:[0,3,5,13,33],transliter:[0,2,3,13],transpos:54,transposit:54,treat:[12,13,23,48,51,64,66,74],treatment:[67,78],tri:[2,5,8,12,31,37,39],trick:1,trim:[0,3,13,83],trivial:2,truncat:[23,69],tue:23,tuesdai:23,tune:[6,10,11,12,17,18,27,46,58,63,64,65,66,67,75,78,79,80,83,88],turkish:30,turn:64,tutori:12,tweak:[1,2,11],two:[0,2,3,5,6,9,12,15,17,23,53,58,59,82,86,87,90,92,93,96],txt:[9,30,96],type:[1,2,5,8,9,19,44,53,59,63,73,80,81,86,87,92,102],typic:[5,14,15,83,90,96],tzone:22,u0000:9,u0007:12,u0009:12,u000a:12,u000c:12,u000d:12,u0010ffff:[9,12],u001a:44,u001b:12,u0032:98,u00a0abov:[19,59,81],u00a9:19,u00df:[19,29,92,94,99],u00e1rio:17,u00e4rtn:17,u00fd:[17,46,58],u0104123:77,u0104:[34,36,50,53,62,92,94],u0105:[9,17,29,34,36,45,50,53,62,77,92,96,98,99,100],u0119:19,u0153:19,u0222:36,u03c0:19,u0627:[58,83],u0633:[58,83],u0635:[58,83],u0639:[58,83],u0644:[58,83],u0645xyz:[58,83],u0647:[58,83],u0648:[58,83],u0649:[58,83],u064a:[58,83],u105:17,u1234:36,u200c:12,u200d:12,u2190:19,u2192:19,u2193:19,u2620:94,u7fffffff:62,u_charset_is_utf8:[2,39,49],u_ea_fullwidth:100,u_ea_wid:100,u_hst_trailing_jamo:100,u_hst_vowel_jamo:100,u_init:2,u_missing_resource_error:2,u_toupp:65,uax:100,ubbfc:68,ubc1f:100,ubrk:63,ubrk_8h:63,ubrk_word_non:[19,47,
59],ubsan:2,ubuntu:[1,2],uc74c:68,uc815:68,ucd:13,uchar32:33,uchar:33,uchar_east_asian_width:100,uchar_hangul_syllable_typ:100,ucs:100,ud6c8:68,ufb00:17,ufdfa:[58,83,96],ufdfaxyz:[58,83],ufffd:[43,44],uhhhh:12,uhhhhhhhh:12,uint32_t:2,umlaut:36,unambigu:82,unassign:9,unavail:[33,56,60],unbound:12,unchang:[43,75,86,87],under:[0,2,5,13],underli:[18,27,46,58,60,75,80,83,88],underscor:55,understand:[5,55,98],undesir:39,unfortun:5,unicod:[0,2,3,5,7,8,11,12,13,17,19,26,32,33,42,43,49,53,62,63,64,66,68,70,71,72,77,80,82,84,86,90,91,92,93,94,97,98,99,100,101],unicode_equival:96,unicodeset:[2,94],unicodestr:2,unidata:9,uninspect:27,union:9,uniqu:[0,2,3,6,8,29,37,93],unit:[2,5,8,9,20,92],unitialis:2,univers:[2,5,13,90,97],unix:[2,5,9,66],unix_lin:66,unknown:[2,5,6,30,33,38],unless:[5,9,27,39,51,52,91],unlik:[23,29,38,42,58,99],unnecessari:97,unprotect:2,unrecogn:66,unsupport:55,until:12,unzip:1,updat:2,upgrad:2,upon:1,upper:[9,13,64,92,94],uppercas:[9,94],uppercase_first:64,ups:[2,5],uregex_8h:66,uregexpflag:66,usag:[1,2,9],use:[1,2,4,9,10,12,38,42,43,44,48,62,66,80,83,85,88,90,94,96,100],use_length:[68,101],use_width:2,usearch:2,used:[1,2,4,5,6,9,13,17,18,19,23,24,27,30,32,33,38,39,40,43,44,45,46,47,48,49,51,52,53,55,57,58,59,60,62,63,64,65,68,69,72,75,76,80,82,83,86,88,89,90,91,92,93,95,97,101],usedynlib:2,useful:[2,5,7,9,19,54,59,79,81,94],user:[1,2,5,6,8,9,10,12,17,20,23,26,29,30,39,44,63,64,65,66,67,78,79,90,92,94,95,96,99],userguid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94,95,96,99],uses:[2,6,8,9,26,30,31,38,65,66,67,78,89,96],usesdaylighttim:89,using:[2,5,6,9,10,15,23,24,30,31,66,79,91,96,102],uslax:23,usr:1,usual:[11,15,32,45,51,53,67,78,87,88,96,99],utc:[25,90],utf8:[5,37,49],utf8toint:42,utf:[0,2,3,13,17,30,31,33,38,39,40,41,44,49,51,53,62,72,88,96,98,102],utf_8:5,utf_bom:5,util:[6,12,54,61,74,76,91,101],utr22:33,utr:82,uuuu:23,uword:66,uxxxx:[45,98],uxxxxxxxx:[45,98],valgrind:2,valid:[2,5,6,17,31,34,35,36,37,43,98],valu:[0,2,3,5,6,9,12],vari:
90,variabl:[1,2,23,64],variant:[6,55,75,86,87],varieti:94,variou:[5,68,101],vec:32,vector:[0,2,3,5,7,13,15,16,17,18,19,20,21,22,23,24,27,28,29,30,31,32,34,35,36,37,38,40,41,42,43,44,45,46,47,48,50,52,53,54,56,58,59,60,61,62,67,68,69,70,71,72,73,75,77,78,79,80,81,82,83,87,88,90,92,93,94,95,96,97,98,99,100,101,102],vectorise_al:75,vectorize_al:[2,75],vel:[84,101],veri:[0,1,2,5,9,11,12,19,39,59,69,81,101],verifi:6,versa:23,version:[1,2,20,32,44,49,74,78,86,87,88,98,99],vertic:82,via:[1,2,11,12,30,38,51,65],vice:23,video:0,vietnames:9,vignett:2,violat:2,vowel:100,vvv:23,vvvv:23,w3c:96,wai:[2,5,10,11,12,16,23,34,35,36,44,50,64,72,76,80,94,101,102],want:[2,6,42,43],warn:[2,4,9,12,18,24,27,32,39,40,42,44,53,63,64,65,66,83,93,98],warnfix:2,warsaw:[2,91],wcwidth:100,weakli:78,web:96,wed:23,week:[20,23],weekdai:26,weekofmonth:22,weekofyear:22,weight:64,well:[2,9,13,36,45,49,64,86,100],were:[2,5,60,94],werner:10,western:5,wget:1,what:[0,4,5,8,9,11,17,39,43],whatev:12,when:[2,4,5,6,8,12,17,23,43,53,64,66,68,79,82,89,90,101],whenev:[4,5,65],where:[2,5,17,23,24,32,39,42,43,51,58,63,67,75,78,82,83,84,85,88,90,97,101],wherea:23,wherev:[76,86,87],whether:[2,6,17,23,27,29,31,34,35,36,38,44,46,49,50,58,64,66,80,82,83,86,87,88,89,96,99],which:[1,2,5,6,8,9,10,13,19,29,30,40,44,51,62,64,67,68,72,78,79,80,81,90,96,101],white:[2,9,12,13,18,46,58,66,75,84,85,97,101],white_spac:[9,18,75,80,84],whitespace_onli:[2,101],who:6,whole:[8,60,65],wickham:0,wide:[0,5,26,96],width:[0,2,3,9,13,23,26,53,68,101],wieczori:94,wiki:96,wikipedia:96,win:2,winbuild:2,window:[2,5,30,33,36,62,89,98,102],windtfmt:2,winnmfmt:2,wise:[2,7,13],wish:[1,12,48,75,80,83],within:[1,2,4,6,8,12,18,23,27,30,46,58,60,66,86,87,101],without:[0,3,6,23,66],word:[0,2,3,8,9,12,19,47,59,63,66,69,75,81,85,88,92],word_boundari:66,work:[1,2,5,30,31,41,65,86,96,98],world:[5,96],worst:11,worth:92,would:[8,62,66,97],wparenthes:2,wraca:94,wrap:[0,2,3,8,13,68,87],wrapper:[60,97],write:[0,3,8,13],writelin:102,written:[5,30,66],wspace:[83,97]
,www:[5,6,9,12,82,96,100],x1a:40,xaaaax:[46,58],xhh:12,xml:30,xnox:2,xxx:[23,48,98],xxxx:23,xxxxx:23,xyx:60,xyz:51,year:[5,20,21,22,23,89,90],yet:[2,13,96,97],yield:[2,23,46,67],you:[0,1,2,4,5,6,9,10,11,12,17,30,31,38,39,42,43,48,51,52,55,57,58,59,62,66,70,75,80,83,84,96,97,101],your:[1,4,5,6,9,38,39,62,83,97],yutannihil:2,yyyi:23,yyyyi:23,zc1:27,zero:[0,2,3,5,9,12,23,58,80,100,101],zip:[1,2],zipf:69,zone:[0,2,3,13,20,21,22,23],zwnbsp:9,zwsp:9,zxy:77,zzz:23,zzzz:23,zzzzz:23},titles:["stringi: THE String Processing Package for R","Installing stringi","What Is New in stringi","R Package stringi Reference","about_arguments: Passing Arguments to Functions in stringi","about_encoding: Character Encodings and stringi","about_locale: Locales and stringi","about_search: String Searching","about_search_boundaries: Text Boundary Analysis in stringi","about_search_charclass: Character Classes in stringi","about_search_coll: Locale-Sensitive Text Searching in stringi","about_search_fixed: Locale-Insensitive Fixed Pattern Matching in stringi","about_search_regex: Regular Expressions in stringi","about_stringi: THE String Processing Package","operator_add: Concatenate Two Character Vectors","operator_compare: Compare Strings with or without Collation","operator_dollar: C-Style Formatting with sprintf as a Binary Operator","stri_compare: Compare Strings with or without Collation","stri_count: Count the Number of Pattern Matches","stri_count_boundaries: Count the Number of Text Boundaries","stri_datetime_add: Date and Time Arithmetic","stri_datetime_create: Create a Date-Time Object","stri_datetime_fields: Get Values for Date and Time Fields","stri_datetime_format: Date and Time Formatting and Parsing","stri_datetime_fstr: Convert strptime-Style Format Strings","stri_datetime_now: Get Current Date and Time","stri_datetime_symbols: List Localizable Date-Time Formatting Data","stri_detect: Detect a Pattern Match","stri_dup: Duplicate Strings","stri_duplicated: Determine Duplicated 
Elements","stri_enc_detect: Detect Character Set and Language","stri_enc_detect2: [DEPRECATED] Detect Locale-Sensitive Character Encoding","stri_enc_fromutf32: Convert From UTF-32","stri_enc_info: Query a Character Encoding","stri_enc_isascii: Check If a Data Stream Is Possibly in ASCII","stri_enc_isutf16: Check If a Data Stream Is Possibly in UTF-16 or UTF-32","stri_enc_isutf8: Check If a Data Stream Is Possibly in UTF-8","stri_enc_list: List Known Character Encodings","stri_enc_mark: Get Declared Encodings of Each String","stri_enc_set: Set or Get Default Character Encoding in stringi","stri_enc_toascii: Convert To ASCII","stri_enc_tonative: Convert Strings To Native Encoding","stri_enc_toutf32: Convert Strings To UTF-32","stri_enc_toutf8: Convert Strings To UTF-8","stri_encode: Convert Strings Between Given Encodings","stri_escape_unicode: Escape Unicode Code Points","stri_extract: Extract Occurrences of a Pattern","stri_extract_boundaries: Extract Data Between Text Boundaries","stri_flatten: Flatten a String","stri_info: Query Default Settings for stringi","stri_isempty: Determine if a String is of Length Zero","stri_join: Concatenate Character Vectors","stri_join_list: Concatenate Strings in a List","stri_length: Count the Number of Code Points","stri_list2matrix: Convert a List to a Character Matrix","stri_locale_info: Query Given Locale","stri_locale_list: List Available Locales","stri_locale_set: Set or Get Default Locale in stringi","stri_locate: Locate Occurrences of a Pattern","stri_locate_boundaries: Locate Text Boundaries","stri_match: Extract Regex Pattern Matches, Together with Capture Groups","stri_na2empty: Replace NAs with Empty Strings","stri_numbytes: Count the Number of Bytes","stri_opts_brkiter: Generate a List with BreakIterator Settings","stri_opts_collator: Generate a List with Collator Settings","stri_opts_fixed: Generate a List with Fixed Pattern Search Engine\u2019s Settings","stri_opts_regex: Generate a List with Regex Matcher 
Settings","stri_order: Ordering Permutation","stri_pad: Pad (Center/Left/Right Align) a String","stri_rand_lipsum: A Lorem Ipsum Generator","stri_rand_shuffle: Randomly Shuffle Code Points in Each String","stri_rand_strings: Generate Random Strings","stri_read_lines: Read Text Lines from a Text File","stri_read_raw: Read Text File as Raw","stri_remove_empty: Remove All Empty Strings from a Character Vector","stri_replace: Replace Occurrences of a Pattern","stri_replace_na: Replace Missing Values in a Character Vector","stri_reverse: Reverse Each String","stri_sort: Sorting","stri_sort_key: Sort Keys","stri_split: Split a String By Pattern Matches","stri_split_boundaries: Split a String at Text Boundaries","stri_split_lines: Split a String Into Text Lines","stri_startsendswith: Determine if the Start or End of a String Matches a Pattern","stri_stats_general: General Statistics for a Character Vector","stri_stats_latex: Statistics for a Character Vector Containing LaTeX Commands","stri_sub: Extract a Substring From or Replace a Substring In a Character Vector","stri_sub_all: Extract or Replace Multiple Substrings","stri_subset: Select Elements that Match a Given Pattern","stri_timezone_info: Query a Given Time Zone","stri_timezone_list: List Available Time Zone Identifiers","stri_timezone_set: Set or Get Default Time Zone in stringi","stri_trans_casemap: Transform Strings with Case Mapping","stri_trans_char: Translate Characters","stri_trans_general: General Text Transforms, Including Transliteration","stri_trans_list: List Available Text Transforms and Transliterators","stri_trans_nf: Perform or Check For Unicode Normalization","stri_trim: Trim Characters from the Left and/or Right Side of a String","stri_unescape_unicode: Un-escape All Escape Sequences","stri_unique: Extract Unique Elements","stri_width: Determine the Width of Code Points","stri_wrap: Word Wrap Text to Format Paragraphs","stri_write_lines: Write Text Lines to a Text 
File"],titleterms:{"2013":2,"2014":2,"2015":2,"2016":2,"2017":2,"2018":2,"2019":2,"2020":2,"2021":2,"byte":[11,62],"case":92,"class":9,"default":[6,39,49,57,91],"function":[4,6,12],"new":2,For:96,Into:82,NAs:[4,61],THE:[0,13],about_argu:4,about_encod:5,about_local:6,about_search:7,about_search_boundari:8,about_search_charclass:9,about_search_col:10,about_search_fix:11,about_search_regex:12,about_stringi:13,align:68,all:[74,98],also:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],analysi:8,argument:[4,14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101,102],arithmet:20,ascii:[34,40],attribut:4,author:13,avail:[13,56,90,95],awar:10,between:[44,47],binari:[9,16],boundari:[8,19,47,59,81],breakiter:63,build:1,captur:60,categori:9,center:68,charact:[5,9,12,14,30,31,33,37,39,51,54,74,76,84,85,86,93,97],check:[34,35,36,96],code:[45,53,70,100],coercion:4,collat:[15,17,64],command:85,compar:[11,15,17],concaten:[14,51,52],conclus:1,contain:85,convers:5,convert:[24,32,40,41,42,43,44,54],count:[18,19,53,62],cran:2,creat:21,current:25,customis:1,data:[26,34,35,36,47],date:[20,21,22,23,25,26],declar:38,deprec:31,descript:[4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],detail:[5,6,7,8,9,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,5
3,54,55,56,57,58,59,60,62,63,64,65,66,67,68,69,70,71,72,73,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101,102],detect:[5,27,30,31],determin:[29,50,83,100],devel:2,duplic:[28,29],each:[38,70,77],element:[29,88,99],empti:[61,74],encod:[5,31,33,37,38,39,41,44],end:83,engin:[10,65],escap:[45,98],exampl:[14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,34,36,45,46,47,48,50,51,52,53,54,55,57,58,59,60,61,62,64,65,66,67,68,69,70,71,74,75,76,77,78,79,80,81,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101],express:12,extract:[46,47,60,86,87,99],facil:13,field:22,file:[72,73,102],fix:[11,65],flatten:48,format:[16,23,24,26,101],from:[32,72,74,86,97],gener:[9,63,64,65,66,69,71,84,94],get:[22,25,38,39,57,91],given:[44,55,88,89],glanc:12,group:60,handl:4,icu4c:1,icu:12,identifi:[6,90],includ:94,input:4,insensit:11,instal:1,introduct:1,ipsum:69,kei:79,known:37,languag:30,latex:85,left:[68,97],length:50,line:[72,82,102],list:[26,37,52,54,56,63,64,65,66,90,95],local:[6,10,11,31,55,56,57],localiz:26,locat:[58,59],lorem:69,map:92,match:[11,18,27,60,80,83,88],matcher:66,matrix:54,meta:12,miss:[4,76],multipl:87,nativ:41,normal:96,note:6,number:[18,19,53,62],object:[4,21],occurr:[46,58,75],oper:[12,16],operator_add:14,operator_compar:15,operator_dollar:16,order:67,packag:[0,3,13],pad:68,paragraph:101,pars:23,pass:4,pattern:[9,11,18,27,46,58,60,65,75,80,83,88],perform:96,permut:67,point:[45,53,70,100],posix:9,possibl:[34,35,36],preserv:4,process:[0,1,13],properti:9,queri:[33,49,55,89],random:71,randomli:70,raw:73,read:[72,73],refer:[3,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,90,91,92,94,95,96,99,100,101],regex:[12,60,66],regular:12,remov:74,replac:[61,75,76,86,87],revers:77,right:[68,97],search:[7,10,65],see:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,
85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],select:88,sensit:[6,10,31],sequenc:98,set:[30,39,49,57,63,64,65,66,91],shuffl:70,side:97,sort:[78,79],split:[80,81,82],sprintf:16,start:83,statist:[84,85],stream:[34,35,36],stri_compar:17,stri_count:18,stri_count_boundari:19,stri_datetime_add:20,stri_datetime_cr:21,stri_datetime_field:22,stri_datetime_format:23,stri_datetime_fstr:24,stri_datetime_now:25,stri_datetime_symbol:26,stri_detect:27,stri_dup:28,stri_dupl:29,stri_enc_detect2:31,stri_enc_detect:30,stri_enc_fromutf32:32,stri_enc_info:33,stri_enc_isascii:34,stri_enc_isutf16:35,stri_enc_isutf8:36,stri_enc_list:37,stri_enc_mark:38,stri_enc_set:39,stri_enc_toascii:40,stri_enc_ton:41,stri_enc_toutf32:42,stri_enc_toutf8:43,stri_encod:44,stri_escape_unicod:45,stri_extract:46,stri_extract_boundari:47,stri_flatten:48,stri_info:49,stri_isempti:50,stri_join:51,stri_join_list:52,stri_length:53,stri_list2matrix:54,stri_loc:58,stri_locale_info:55,stri_locale_list:56,stri_locale_set:57,stri_locate_boundari:59,stri_match:60,stri_na2empti:61,stri_numbyt:62,stri_opts_brkit:63,stri_opts_col:64,stri_opts_fix:65,stri_opts_regex:66,stri_ord:67,stri_pad:68,stri_rand_lipsum:69,stri_rand_shuffl:70,stri_rand_str:71,stri_read_lin:72,stri_read_raw:73,stri_remove_empti:74,stri_replac:75,stri_replace_na:76,stri_revers:77,stri_sort:78,stri_sort_kei:79,stri_split:80,stri_split_boundari:81,stri_split_lin:82,stri_startsendswith:83,stri_stats_gener:84,stri_stats_latex:85,stri_sub:86,stri_sub_al:87,stri_subset:88,stri_timezone_info:89,stri_timezone_list:90,stri_timezone_set:91,stri_trans_casemap:92,stri_trans_char:93,stri_trans_gener:94,stri_trans_list:95,stri_trans_nf:96,stri_trim:97,stri_unescape_unicod:98,stri_uniqu:99,stri_width:100,stri_wrap:101,stri_write_lin:102,string:[0,7,10,13,15,17,24,28,38,41,42,43,44,48,50,52,61,68,70,71,74,77,80,81,82,83,92,97],stringi:[0,1,2,3,4,5,6,8,9,10,11,12,39,49,57,91],strptime:24,style:[16,24],substr:[86,87],support:1,text:[8,10,19,47,59,72,73,81,82,
94,95,101,102],time:[20,21,22,23,25,26,89,90,91],togeth:60,transform:[92,94,95],translat:93,transliter:[94,95],trim:97,two:14,unicod:[9,45,96],unicodeset:9,uniqu:99,usag:[14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],utf:[5,32,35,36,42,43],valu:[4,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],vector:[4,14,51,74,76,84,85,86],what:2,width:100,without:[15,17],word:101,wrap:101,write:102,zero:50,zone:[89,90,91]}}) \ No newline at end of file +Search.setIndex({docnames:["index","install","news","rapi","rapi/about_arguments","rapi/about_encoding","rapi/about_locale","rapi/about_search","rapi/about_search_boundaries","rapi/about_search_charclass","rapi/about_search_coll","rapi/about_search_fixed","rapi/about_search_regex","rapi/about_stringi","rapi/operator_add","rapi/operator_compare","rapi/operator_dollar","rapi/stri_compare","rapi/stri_count","rapi/stri_count_boundaries","rapi/stri_datetime_add","rapi/stri_datetime_create","rapi/stri_datetime_fields","rapi/stri_datetime_format","rapi/stri_datetime_fstr","rapi/stri_datetime_now","rapi/stri_datetime_symbols","rapi/stri_detect","rapi/stri_dup","rapi/stri_duplicated","rapi/stri_enc_detect","rapi/stri_enc_detect2","rapi/stri_enc_fromutf32","rapi/stri_enc_info","rapi/stri_enc_isascii","rapi/stri_enc_isutf16","rapi/stri_enc_isutf8","rapi/stri_enc_list","rapi/stri_enc_mark","rapi/stri_enc_set","rapi/stri_enc_toascii","rapi/stri_enc_tonative","rapi/stri_enc_toutf32","rapi/stri_enc_toutf8","rapi/stri_encode","rapi/stri_escape_unicode","rapi/stri_extract","rapi/stri_extract_boundaries","ra
pi/stri_flatten","rapi/stri_info","rapi/stri_isempty","rapi/stri_join","rapi/stri_join_list","rapi/stri_length","rapi/stri_list2matrix","rapi/stri_locale_info","rapi/stri_locale_list","rapi/stri_locale_set","rapi/stri_locate","rapi/stri_locate_boundaries","rapi/stri_match","rapi/stri_na2empty","rapi/stri_numbytes","rapi/stri_opts_brkiter","rapi/stri_opts_collator","rapi/stri_opts_fixed","rapi/stri_opts_regex","rapi/stri_order","rapi/stri_pad","rapi/stri_rand_lipsum","rapi/stri_rand_shuffle","rapi/stri_rand_strings","rapi/stri_rank","rapi/stri_read_lines","rapi/stri_read_raw","rapi/stri_remove_empty","rapi/stri_replace","rapi/stri_replace_na","rapi/stri_reverse","rapi/stri_sort","rapi/stri_sort_key","rapi/stri_split","rapi/stri_split_boundaries","rapi/stri_split_lines","rapi/stri_startsendswith","rapi/stri_stats_general","rapi/stri_stats_latex","rapi/stri_sub","rapi/stri_sub_all","rapi/stri_subset","rapi/stri_timezone_info","rapi/stri_timezone_list","rapi/stri_timezone_set","rapi/stri_trans_casemap","rapi/stri_trans_char","rapi/stri_trans_general","rapi/stri_trans_list","rapi/stri_trans_nf","rapi/stri_trim","rapi/stri_unescape_unicode","rapi/stri_unique","rapi/stri_width","rapi/stri_wrap","rapi/stri_write_lines"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["index.rst","install.rst","news.rst","rapi.rst","rapi/about_arguments.rst","rapi/about_encoding.rst","rapi/about_locale.rst","rapi/about_search.rst","rapi/about_search_boundaries.rst","rapi/about_search_charclass.rst","rapi/about_search_coll.rst","rapi/about_search_fixed.rst","rapi/about_search_regex.rst","rapi/about_stringi.rst","rapi/operator_add.rst","rapi/operator_compare.rst","rapi/operator_dollar.rst","rapi/stri_compare.rst","rapi/stri_count.rst","rapi/stri_count_boundari
es.rst","rapi/stri_datetime_add.rst","rapi/stri_datetime_create.rst","rapi/stri_datetime_fields.rst","rapi/stri_datetime_format.rst","rapi/stri_datetime_fstr.rst","rapi/stri_datetime_now.rst","rapi/stri_datetime_symbols.rst","rapi/stri_detect.rst","rapi/stri_dup.rst","rapi/stri_duplicated.rst","rapi/stri_enc_detect.rst","rapi/stri_enc_detect2.rst","rapi/stri_enc_fromutf32.rst","rapi/stri_enc_info.rst","rapi/stri_enc_isascii.rst","rapi/stri_enc_isutf16.rst","rapi/stri_enc_isutf8.rst","rapi/stri_enc_list.rst","rapi/stri_enc_mark.rst","rapi/stri_enc_set.rst","rapi/stri_enc_toascii.rst","rapi/stri_enc_tonative.rst","rapi/stri_enc_toutf32.rst","rapi/stri_enc_toutf8.rst","rapi/stri_encode.rst","rapi/stri_escape_unicode.rst","rapi/stri_extract.rst","rapi/stri_extract_boundaries.rst","rapi/stri_flatten.rst","rapi/stri_info.rst","rapi/stri_isempty.rst","rapi/stri_join.rst","rapi/stri_join_list.rst","rapi/stri_length.rst","rapi/stri_list2matrix.rst","rapi/stri_locale_info.rst","rapi/stri_locale_list.rst","rapi/stri_locale_set.rst","rapi/stri_locate.rst","rapi/stri_locate_boundaries.rst","rapi/stri_match.rst","rapi/stri_na2empty.rst","rapi/stri_numbytes.rst","rapi/stri_opts_brkiter.rst","rapi/stri_opts_collator.rst","rapi/stri_opts_fixed.rst","rapi/stri_opts_regex.rst","rapi/stri_order.rst","rapi/stri_pad.rst","rapi/stri_rand_lipsum.rst","rapi/stri_rand_shuffle.rst","rapi/stri_rand_strings.rst","rapi/stri_rank.rst","rapi/stri_read_lines.rst","rapi/stri_read_raw.rst","rapi/stri_remove_empty.rst","rapi/stri_replace.rst","rapi/stri_replace_na.rst","rapi/stri_reverse.rst","rapi/stri_sort.rst","rapi/stri_sort_key.rst","rapi/stri_split.rst","rapi/stri_split_boundaries.rst","rapi/stri_split_lines.rst","rapi/stri_startsendswith.rst","rapi/stri_stats_general.rst","rapi/stri_stats_latex.rst","rapi/stri_sub.rst","rapi/stri_sub_all.rst","rapi/stri_subset.rst","rapi/stri_timezone_info.rst","rapi/stri_timezone_list.rst","rapi/stri_timezone_set.rst","rapi/stri_trans_casemap.rst","rapi/stri_t
rans_char.rst","rapi/stri_trans_general.rst","rapi/stri_trans_list.rst","rapi/stri_trans_nf.rst","rapi/stri_trim.rst","rapi/stri_unescape_unicode.rst","rapi/stri_unique.rst","rapi/stri_width.rst","rapi/stri_wrap.rst","rapi/stri_write_lines.rst"],objects:{},objnames:{},objtypes:{},terms:{"0000":[5,9],"000a":66,"001a":44,"00ad":101,"0100":23,"0105":9,"0123456789":70,"032":40,"0377":12,"0530":23,"075258":23,"0800":23,"0ooo":12,"0x0a":83,"0x0b":83,"0x0c":83,"0x0d":83,"0x1a":40,"0x1f":99,"0x2028":83,"0x2029":83,"0x3000":101,"0x85":83,"0xff01":101,"0xff5e":101,"100":[2,64,67,72,79],"100000":30,"101":[67,72,79],"102":2,"105":2,"106":2,"10646":13,"107":2,"108":2,"109":2,"10ffff":[5,9],"110":2,"111":2,"1119":102,"112":2,"114":2,"116":2,"117":2,"118":2,"1184":102,"119":2,"120":2,"122":2,"123":[2,14,18,27,47,50,51,52,53,62,76,78,82,89,93,94],"1234":76,"124":2,"1250":[30,36],"1251":30,"1252":[2,5,30],"1253":30,"1254":30,"1255":30,"1256":30,"126":2,"127":[5,34,38,40,43],"128":2,"129":2,"12l":21,"132":2,"133":2,"134":2,"135":2,"137":2,"138":2,"139":2,"141":2,"143":2,"144":2,"149":2,"154":2,"157":2,"164":2,"165":2,"168":2,"169":2,"16be":[30,31,35],"16le":[30,31,35],"170":2,"174":2,"175":2,"176":2,"177":5,"180":2,"183":2,"187":2,"188":2,"189":23,"190":69,"193":2,"1970":25,"1981":102,"199":2,"1990":9,"1996":23,"1999":[10,23],"1bc":[21,22],"1st":23,"1to1":33,"2001":2,"2002":12,"200b":101,"2013":0,"2014":[0,20],"2015":[0,21,23],"2016":[0,20],"2017":0,"2018":0,"2019":0,"2020":0,"2021":0,"2022":30,"2028":[9,83],"2029":[9,83],"205":2,"2060":9,"206f":9,"207":2,"210":2,"214":2,"216":2,"219":2,"220":2,"227":2,"230":2,"231":2,"232":2,"235":23,"2350":23,"238":2,"242":2,"2451334":23,"253":2,"254":2,"258":2,"263":2,"266":2,"267":2,"270":2,"285":2,"288":2,"289":2,"296":2,"2bc":[21,22],"2nd":23,"314":2,"3166":[6,91],"317":2,"318":2,"319":2,"31t23":23,"325":2,"32be":[30,31,35],"32le":[30,31,35],"334":2,"335":2,"337":2,"338":2,"341":2,"343":2,"344":2,"345":2,"3456":[87,88],"347":2,"348":2,"355":2,"
362":2,"3629":13,"363":2,"364":2,"366":2,"369":2,"370":2,"372":2,"382":2,"386":2,"393":2,"398":2,"399":2,"3rd":2,"400":2,"401":2,"405":2,"408":2,"414":2,"415":2,"421":2,"456":[27,52,76,82],"4601":23,"5198":97,"55200":46,"5775":21,"61201235":23,"639":6,"667":[87,88],"789":[27,52,76,82,87,88],"822":23,"8601":23,"8859":[5,30],"8bit":33,"9899":9,"999":21,"abstract":12,"bart\u0142omiej":0,"break":[2,8,19,47,59,63,82,93,102],"byte":[0,2,3,5,7,12,13,30,31,32,33,34,35,36,38,40,41,42,43,44,53,66,80,87,99],"case":[0,1,2,3,4,5,6,7,8,9,10,11,12,13,17,19,24,27,30,31,43,44,46,47,51,53,55,59,63,64,65,66,70,76,81,82,88,95,97,102],"char":85,"class":[0,2,3,7,8,12,13,20,21,22,23,25,26,64,71,91,92,98],"default":[0,1,2,3,5,12,15,17,18,19,20,21,22,23,26,27,29,31,33,37,38,43,44,46,47,55,58,59,60,63,64,65,66,67,68,72,73,76,79,80,81,82,83,84,89,90,91,93,98,100,102,103],"enum":[2,66],"export":2,"final":[5,6,9,12,101],"float":2,"function":[0,1,2,3,5,9,10,11,13,15,17,18,19,20,23,24,27,29,30,31,32,34,35,36,38,40,41,42,43,44,46,47,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,72,73,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,95,97,98,99,100,101,102,103],"import":[2,4],"long":[1,2,4,23,90,91],"new":[0,12,14,82,102],"null":[1,2,6,17,18,19,20,21,22,23,26,27,29,31,32,33,39,41,42,44,46,47,51,52,55,57,58,59,60,63,64,67,72,73,76,79,80,81,82,84,89,90,92,93,100,102,103],"public":9,"return":[2,5,7,12,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,68,69,70,71,73,74,75,76,77,78,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],"short":[1,2,9,11,23,49,90],"static":2,"strin\u0261i":0,"switch":[2,5],"throw":2,"true":[2,5,9,12,17,19,21,23,27,29,37,43,44,46,47,48,49,51,52,54,58,59,64,65,66,67,68,69,71,72,75,76,79,81,82,83,87,88,89,102],"try":[1,2,31],"var":1,"while":[2,5,6,8,17,39],Added:2,For:[0,1,3,4,5,6,8,9,10,12,17,19,23,24,30,32,36,37,43,44,45,46,47,53,58,59,60,
62,63,66,67,72,76,79,80,82,84,87,88,90,92,93,95,98,99],Into:[0,3],Its:[12,36,87,88],Los:23,Mrs:[59,82],NAs:[0,3],NFs:97,Not:[30,46,57,62,76,87,92],One:6,Such:[5,29,87,88,100],Sys:[5,38,39],THE:[3,47,81],The:[0,1,2,5,6,7,8,9,10,11,12,13,17,19,20,23,25,27,30,31,34,36,37,41,48,54,58,59,60,62,63,67,69,72,73,76,79,80,81,82,89,91,97,99,101,102],Their:[6,12],There:5,These:[5,7,8,9,14,15,17,18,19,23,27,35,44,46,47,51,52,58,59,60,68,76,81,83,84,89,93,97,98],Use:[2,58,59],Used:90,Useful:2,Uses:99,Using:2,With:[12,55,93],_boundari:[2,7,59],_charclass:[2,7,9,84],_coll:[2,7,10,84],_count:2,_euro:6,_fix:[2,7,65,84],_limit:2,_regex:[2,7,12,58,60,76],_static:2,_word:[47,59],_xpg6:2,a_b_c__d:81,a_b_c_d:81,aaa:[23,46,58,98],aaaa:[46,58,76],aaaaaaaa:[46,58],aabbcc:[46,58],ab_c:81,aba:46,ababa:84,abababa:46,abaca:76,abbrevi:[23,26],abc:[9,14,27,28,46,50,51,53,58,62,78,87,88,93],abcd:[60,68],abcdefghi:70,abcdefghijk:[46,58],abil:[73,80,103],abl:[2,7],about:[0,2],about_argu:[0,3,5,6,7,8,9,10,11,12,13],about_encod:[0,3,4,6,7,8,9,10,11,12,13,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44],about_local:[0,3,4,5,7,8,9,10,11,12,13,15,17,19,29,31,47,55,56,57,59,64,67,72,79,80,82,93,100,102],about_search:[0,3,4,5,6,8,9,10,11,12,13,18,19,27,46,47,58,59,60,63,64,65,66,76,81,82,83,84,89,93,98,102],about_search_boundari:[0,3,4,5,6,7,9,10,11,12,13,15,17,19,29,31,47,59,63,64,67,72,79,80,82,83,93,100,102],about_search_charclass:[0,3,4,5,6,7,8,10,11,12,13,98],about_search_col:[0,3,4,5,6,7,8,9,11,12,13,15,17,19,29,31,47,59,64,67,72,79,80,82,93,100,102],about_search_fix:[0,3,4,5,6,7,8,9,10,12,13,65],about_search_regex:[0,3,4,5,6,7,8,9,10,11,13,66],about_stringi:[0,3,4,5,6,7,8,9,10,11,12],abov:[9,31,54,60,64],absolut:1,ac_config_fil:2,ac_subst:2,acagagactttagatagagaaga:[58,60],accent:[9,10,11,95],accept:[2,63,89],access:[1,2,9,16,42],accompani:13,accord:[9,38,44,46,62,64,72,79,81,93],accordingli:2,account:[8,10,17,30,65,68,90,102],acd:9,acgt:[60,94],achiev:95,across:2,act:[2,14,35,63,68,102],action:63,activ:
[5,9,62,97],actual:[11,102],add:[2,20,44,68],added:[2,68],adding:20,addit:[1,2,17,18,19,23,27,29,46,47,58,59,60,67,72,76,79,80,81,82,84,89,91,93,100],addition:[2,5,13,17,37,38,60],address:2,adipis:[18,76,85,86,87,102],adjac:23,adjust:98,advanc:[4,9,12,63],aesthet:102,affect:[2,81,82,95],after:[2,12,30,64],aga:[46,58,76],agaga:[46,58,76],again:[2,9],against:[1,2,30],aggreg:[85,86],agonek:78,ahead:12,aim:[2,9,19,44,73],ala:[65,66],algorithm:[2,9,10,11,13,67,79,80,86,97,102],alia:[2,17,29,44,54,64,66,69,73,74,75,76,87,88,102,103],alias:[2,9,37,51,52],align:[0,3],alik:64,aliquet:[85,102],all:[0,1,2,3,4,5,6,7,9,10,12,13,15,17,18,19,22,23,26,27,28,29,30,31,33,34,36,38,40,43,44,45,46,47,52,56,57,58,59,60,61,64,76,81,82,91,92,97,98,102,103],alloc:2,allow:[2,5,9,10,12,17,18,21,27,32,46,58,60,66,87,102],almost:[4,5,91],alon:23,along:30,alpha:27,alphabet:[9,12],alphanumer:5,alreadi:[1,29,92],also:[0,1,2,68,78],alter:12,altern:[2,9,12,58,80,87],alternate_shift:64,alwai:[5,9,17,31,39,40,44,51,54,56,57,71,73,89,91,97,102],ambigu:5,america:23,amet:[18,52,69,76,81,85,86,87,102],among:[0,2,5,9,13,60,68],amount:[5,20,30,91],ampm:[22,26],analog:95,analysi:[0,2,3,7,12,13,19,47,59,63,82,102],angel:23,angl:[12,30],ani:[0,2,4,5,6,9,12,13,17,23,29,32,43,45,51,55,63,64,65,66,76,83,87,88,90,95,97,101],annex:[9,97,101],anno:23,anoth:[9,95],anydupl:29,anymor:2,anyth:[55,87],anywai:[1,2],apart:[5,37],api:[0,2,9,13,24,26,32,38,63,64,66,91,92],apidoc:[9,13,26,63,64,66,91,92],appear:[5,6,12,23,63,71,81,83,85,86],append:23,appli:[4,9,12,14,81,83,88,91,101,102],applic:[2,5,87,88],appreci:0,appropri:[1,8,44,46,64,81],approxim:[2,13,101],arab:30,arbitrari:[32,84,98],architectur:64,archiv:1,area:91,arg:[1,2],argument:[0,1,2,3,5,6,13],aris:97,arithmet:[0,3],arrai:2,arrang:102,asan:2,ascend:67,ascii:[0,2,3,5,9,12,23,31,33,36,38,39,43,44,45,66,71,95,99,101,102],ascii_hex_digit:9,asian:101,ask:6,assert:12,assum:[1,2,4,5,38,39,40,43,44,97],assumpt:[5,38,40],asymmetr:9,atom:[2,4,12,16,51,54],atomic_vector:16
,attempt:2,attr:22,attrib:2,attribut:[2,37,64,100],augu:[85,86,102],australian:6,author:0,auto:2,autoconf:2,autom:5,automat:[5,6,9,38,44,97],avail:[0,2,3,6,7,9,12,37,46,65,66,76,90,95],avoid:[2,6,9,97],awar:[6,11,12,13,27,64,80],baaab:18,baab:18,bab:18,babaab:94,babab:18,back:[6,9,12,23,87],backslash:[9,66,76],backtrack:66,backward:[2,64],bacon:[19,52,59,60,82],bartek:13,bartolini:[46,58],base:[1,2,5,7,9,10,13,15,16,21,22,24,29,31,59,64,69,72,84,87,88,95,100,101,102],basic:[2,5,8,23,33,54,55,90],bastienfr:2,bbbbb:58,bear:76,becam:2,becaus:[1,2,4,6,11,14,30,31,36,44,65,73,97],becom:[1,23,81,103],been:[0,1,2,5,9,30,53,63,84,92],befor:[2,9,12,30,45,64,90,102],begin:[12,13,67,79,86,91],behavior:[4,6,8,12,43,51,63,64,65,66,67,79,91],behaviour:2,behind:[2,12],being:[2,5,12,23,55,64,87,102],bell:12,belong:9,below:[2,4,5,8,9,12,17,23,33,46,58,64,67,76,79,85],best:[5,6,30,31],better:[5,12,29,65,70,100],between:[0,2,3,5,9,10,12,17,24,48,59,64,81,98,102],bewar:99,biarch:2,bibliograph:9,bidi:9,bidi_control:9,bidi_mirror:9,bidirect:[9,70,71,78,87],big5:30,big:[1,2,71],bin:[1,2],binari:[0,2,3,7,14,18,73,74,85,98,103],bit:[5,31,32,33,36,39,40,42,43,62,91],bitcoin:98,bitwis:11,black:76,bogu:43,bom:[2,5,17,43,44],both:[2,5,17,19,20,35,43,68,75,87,98,102],bound:[9,87],boundari:[0,2,3,7,12,13,63,66,81,93,102],boundaryanalysi:[8,63],box:[1,2],bracket:[9,12,30],breakfast:60,breakiter:[0,2,3,8,19,47,59,82,93,102],briefli:9,bring:2,british:2,broader:95,broken:2,brown:[59,76,82],bsd:[0,2,13],buddhist:26,buffer:2,bug:[0,1,2],bugfix:2,build:[0,2],built:[1,2,49,51,54,95],bundl:[1,2],by_row:54,byrow:[2,46,47,54,81,82],bytewis:[29,64,100],c90:9,calendar:[2,6,20,21,22,23,26,90],call:[0,1,2,4,5,6,11,14,15,17,18,19,27,30,41,42,43,44,46,47,48,55,57,58,59,60,73,76,81,82,84,88,89,91,95,102],cam:101,can:[0,1,2,5,8,9,30,32,38,41,43,44,70,74,88,93,95,98,102],canadian:64,cannot:[2,8,44,73,99],canon:[2,10,15,17,29,33,37,97,100],capabl:95,capit:[8,93],captur:[0,2,3,12,46,76],care:[4,87],carefulli:5,carriag
:[12,83],cascad:5,case_ignor:9,case_insensit:[2,27,46,58,65,66,76],case_level:[17,64],case_map:65,case_sensit:9,casemap:93,cat:[1,5,68,69,101,102],categori:[5,7,12,18,38,39,63,98,101],caus:[2,9,43,64],cbind:[87,88],ccc:23,cccc:23,ccccc:23,cccccc:23,center:[0,3],cento:[1,2],central:5,certain:[23,45],certainli:36,cflag:1,cg_miss:[2,60],chain:[2,69,95],chang:[2,5,6,9,12,30,39,42,57,66,68,87,91,92,93,102],changes_when_casefold:9,changes_when_casemap:9,changes_when_lowercas:9,changes_when_nfkc_casefold:9,changes_when_titlecas:9,changes_when_uppercas:9,charact:[0,2,3,4,6,7,8,13,15,16,17,18,19,23,24,27,28,29,32,34,35,36,38,40,41,42,43,44,45,46,47,48,49,50,52,53,55,56,58,59,60,61,62,63,67,68,69,70,71,72,73,76,78,79,80,81,82,83,84,88,89,91,93,95,96,97,99,100,101,102,103],character_set:30,charclass:[2,9,18,27,46,58,71,76,81,84,85,89,98,101],charmod:97,charscmdenvir:86,charset:[39,49],charsiz:33,charsnwhit:85,charswhit:86,charsword:86,charsxp:2,chartr:2,check:[0,1,2,3,5,6,9,17,30,31,38,46,64,68,84],chines:[8,9,23,30],chladni:[17,67,72,79,80],choic:[5,23],choos:1,chunk:7,circul:6,circumst:24,citi:23,civil:6,cjkv:9,clang:2,clariti:9,classicu_1_1col:64,classicu_1_1dateformatsymbol:26,classicu_1_1timezon:[91,92],classicu_1_1unicodeset:9,classif:9,classifi:35,claus:[0,2,13],cldr:2,clean:2,clever:[17,44],clock:[22,23],close:[1,9],closer:91,cluster:12,cmd:[1,86],code:[0,2,3,5,6,8,9,12,13,15,17,19,31,32,33,40,42,43,44,59,62,64,65,68,71,78,84,85,87,91,93,94,100,102],codec:2,codepoint:97,coerc:[2,37,48,54,67,79],coercibl:[4,14,15,17,19,20,22,23,32,38,42,47,50,51,53,59,62,77,82,101],coercion:2,coexist:5,coll:[18,27,46,58,64,65,76,81,84,89],collaps:[2,4,30,48,51,52,69,70],collat:[0,2,3,6,7,10,13,29,67,72,79,80,100],collect:2,colour:1,column:[2,22,54,58,59,60,67,87,88,101],com:[1,2,13],combin:[9,12,55,95,97],come:[8,93],command:[0,1,3],comment:[12,66],common:[1,2,40,90],commonli:[9,30],commun:[5,6],compar:[0,3,5,6,12,13,29,60,62,76],comparison:[2,5,6,15,17,64,67,79],compat:[2,23,97,101,102
],competit:5,compil:[1,2],complement:9,complex:[1,5,10,11,64,94,102],complic:55,compon:[13,26,31,33,49,90],composit:[95,97],compound:95,comprehens:[2,9],comput:[5,6,22,62,80],con:[2,73,74,103],concaten:[0,2,3,5,13,28],concept:6,concern:91,concis:49,conclus:0,condition:2,confid:[30,31],config:[1,2],configur:[1,2,30,87],conform:[2,12,73],confus:51,conjoin:[10,11],conjunct:2,connect:[2,9,54,73,74,103],connector_punctu:12,consectetur:[18,76,85,86,87,102],consecut:[27,46,58,76,102],consequ:[15,39],consid:[44,64],consider:5,consist:[0,2,4,5,9,13,17,24,40,47,52,60,68,69,71,93,94],consol:[5,53,68,102],conson:101,consortium:13,constant:[2,12,66],construct:[2,21],contain:[0,3,9,49,63,66,76,80,85,102],content:[13,83,97],context:[12,23,26,65,86,93],continu:9,contrari:[98,102],contribut:[0,13],contributor:86,control:[2,8,9,12,64,66,67,79,84,99,101],conveni:[0,2,13,18,27,32,46,57,58,60,63,64,65,66,68,76,77,81,84,89,95,98],convent:[6,19,45,47,59,93,102],convers:[2,11,13,24,30,44,74,95],convert:[0,2,3,4,5,9,23,31,37,45,95,97],converted_str:44,cooki:93,coordin:91,copi:[1,2,4,87,88,100],coptic:26,copyright:[2,13],correct:[0,2,6,10,11,13,87],correctli:[1,2,5,39],correspond:[2,4,9,15,17,27,32,34,36,42,51,53,60,72,76,83,87,88,91,94],cost:[2,102],cost_expon:102,could:[2,6,30],count:[0,2,3,7,8,13,23,84,86,87],counterpart:[29,100],countri:[6,55,91],cours:[2,4,30,31,84],cover:[5,12,31],cpp:[2,31],cppflag:1,cpu:66,cra:[85,102],cran:0,creat:[0,1,3,5,14,56],criteria:[2,67,72],crlf:83,csrucod:31,cstring:2,cultur:6,currenc:[6,9],current:[0,1,2,3,6,9,12,22,23,39,41,44,49,57,60,62,69,73,90,92,103],custom:[1,2,63],customis:0,cxx11:[1,2],cxx1x:2,cxxcpp:2,cxxflag:1,cyclic:23,cyril:[9,95],czech:30,czw:23,d_ef_g:81,dai:[20,21,22,23],danish:30,dash:[2,9],dat:2,data:[0,1,2,3,5,9,11,22,23,30,31,38,44,59,62,64,67,69,72,81,91,103],databas:[9,13],date:[0,2,3,13,24,91,92],date_long:23,dateformatsymbol:26,datetim:[20,21,22,23,24,25,26,90,91,92],datetime_relative_medium:23,davisvaughan:2,daylight:[23,90,91],day
ofweek:22,dayofyear:22,de_d:[17,93],deal:[2,4,5,42,53],debian:1,debug:2,decid:5,decim:[9,12],decimal_numb:12,declar:[0,2,3,5,39,40,41,43,44],decnumb:2,decod:[32,95],decomposit:97,decreas:[30,31,67,79],def:27,default_ignorable_code_point:9,default_local:2,defin:[9,10,12,32,39,49,64,81,83,84,87,88,91,97,99],definit:[64,66],delimit:81,deliv:6,denorm:5,denot:[5,9,22,48,76,84,87,102],depend:[1,2,5,6,8,9,12,15,17,18,22,23,27,29,46,57,58,66,67,72,76,79,80,81,83,84,89,92,93,100,102],deprec:[0,2,3,9,29,63,64,65,66,69,73,74,103],descend:67,describ:[9,10,11,12,54],design:[2,5,23,91,95],desir:[6,66,71,77,95],dessert:60,detail:4,detect:[0,2,3,6,7,13,35,38,39,42,53,60,65,74,85],determin:[0,2,3,5,9,13,17,19,27,30,40,81,83,92,97,102],dev:[1,2,9,13,26,63,64,66,91,92],devel:[0,1],develop:[1,5,13],diacrit:[8,9,17],diagnos:44,diagnost:2,did:[2,6],differ:[2,5,6,8,9,12,17,18,19,30,46,48,51,58,60,66,76,93,94,95,97,98],digit:[5,9,12,13,23,45,64,71,91,99],digraph:9,dim:4,dimitri:2,dir:[1,2],directli:[2,58,80,84],directori:1,disabl:[1,2,12],disallow:[9,44],disappear:9,discourag:9,discret:69,discuss:[5,39,44,55],disjoint:88,dispatch:68,displai:[2,5,8,9,23,69],display_typ:90,distinguish:12,distribut:[1,2,13,69],divers:1,doc:[9,10,13,26,63,64,66,91,92],document:[2,8,9,13,26,63,64,66,91,92,97],doe:[1,2,5,6,8,9,12,17,23,24,33,55,60,64,91,101,102],dog:76,doing:[4,5,39],dolor:[18,52,69,76,81,85,86,87,102],domini:23,done:[11,71],dot:9,dot_al:66,dotal:66,download:[0,1,2],draft:[0,2,13,97],drastic:2,draw:71,drop:4,dst:[90,91],dt_relative_styl:23,dt_style:23,du_disable_renam:2,dual:[32,42],due:[1,4,5,37],dummi:[2,69],duplic:[0,2,3,37,100],dure:[6,56,81,91],dutch:30,dynam:[2,102],dynlib:2,e0000:9,e0fff:9,each:[0,2,3,4,5,6,7,8,9,13,14,18,24,27,28,29,30,31,32,37,40,42,46,47,51,52,53,54,58,60,62,68,71,72,73,76,77,81,83,84,85,86,87,88,93,94,95,96,97,102,103],eagerli:2,earli:2,eas:2,easier:[5,89],easili:[2,42,103],east:101,eee:23,eeee:23,eeeee:23,eeeeee:23,effect:[39,57,91],effici:[2,4,10,12,43],efficient_te
xt_searching_in_java:10,egg:[19,59,60,82],eight:12,either:[1,5,9,12,18,23,24,27,44,45,46,63,81,84,89,91,93],element:[0,2,3,4,6,13,15,17,18,27,30,31,34,36,37,42,46,47,48,50,51,53,54,58,60,67,71,76,79,81,83,84,85,86,88,103],elit:[18,76,85,86,87,102],ellipsi:36,embed:44,emoji:[2,9,46],emoji_modifi:9,emoji_modifier_bas:9,emoji_present:9,emploi:9,empti:[0,2,3,4,6,9,12,18,27,31,46,47,48,50,51,81,82,83,84,87],emul:2,en_au:6,en_u:[6,57,59,82,93],enabl:[12,30,65,66],enc2utf8:[42,43],enc:[33,39],enclos:[9,23],encod:[0,2,3,9,13,30,32,34,35,36,40,42,43,49,53,62,73,74,80,89,97,103],encoding_convers:[5,32,40,41,42,43,44],encoding_detect:[5,30,31,34,35,36],encoding_manag:[5,33,37,38,39],encodingnam:44,encount:[5,12,39],encourag:[1,101],end:[0,2,3,7,8,9,12,13,27,30,32,46,57,58,59,62,63,66,67,76,79,83,86,87,88,91,92,98,102],endian:[1,2],engin:[0,2,3,7,9,11,12,13,18,27,30,46,58,60,76,81,84,89],english:[6,10,30],enhanc:80,entir:66,entireti:73,entri:[0,37,66],enumer:101,envir:86,environ:[1,2,41,86],equal:[17,23,29,30,31,51,52,64,68,71,81,82,100,101],equat:91,equip:2,equival:[2,5,9,10,15,16,17,19,29,38,42,48,51,59,64,65,66,76,77,80,83,89,97,100,101],era:[22,23,26],erron:44,error:[2,4,9,12,33,53,66,85,102],error_on_unknown_escap:66,escap:[0,3,12,13,23,66,76],especi:[1,5,10,30,87],essenti:97,establish:[2,4,57,64,92],eszett:93,etc:[1,2,4,5,12,21,22,26,42,46,63,81],etiam:[85,102],euc:30,euro:[2,6],europ:[90,92],european:[5,6],evalu:12,even:[5,8,12,23,30,54,55],evenli:102,ever:5,everi:[13,60,76,78,102],everyth:9,exact:[2,12],exactli:[5,12,17,32,33,38,42,68],examin:[5,27],exampl:[0,2,5,6,8,9,11,12],examplercppstringi:2,exce:[44,73],except:[2,9,12,23,102],exclud:[63,89],exclus:[87,88],exdent:[2,102],execut:[1,45],exemplar:23,exemplari:23,exercis:69,exist:[1,2,5,12],expand:2,expect:[1,4,6,9,66],experi:[1,102],expert:39,explain:[4,5,6,7],explicit:5,explicitli:[44,87],expon:102,express:[0,3,4,5,7,9,13,66,83,98],extend:[5,9,23,36,38,40,43],extens:2,extern:[2,5],extra:[1,64,94],extract:[0,2,3,7,12,
13,29,58,81,82],face:1,facil:[10,11,30,31,66,99],fact:[30,37],factor:4,fail:[1,2,5,6,12,30,31,39,41,43,62,66],failur:[2,12,30,31],fall:[9,23],fallback:1,fallback_encod:[2,73],fals:[2,5,21,23,27,29,30,35,36,37,43,44,46,47,48,49,51,54,58,59,60,63,64,65,67,68,69,75,76,79,81,82,83,84,87,88,89,102],famili:[2,31,37,63],familiar:2,fanci:[13,48],faq:5,fashion:[2,17],fast:[0,2,11,12,13],faster:[9,44,84,89],fastest:50,fcd:64,featur:[0,1,2,12,19,59,68,82,102],feature_test:2,februari:20,fedora:1,feed:[12,83],feel:[14,15,17,84],fetch:[1,90,91],few:[0,1,12,30,31],fewer:12,fff0:9,fffb:9,fffd:44,field:[0,2,3,23,81],file:[0,1,2,3,5,13,30,63,83,85,86],fill:[2,46,47,54,81,82],filter:[30,82],filter_angle_bracket:30,find:[1,4,8,9,50,58,67],first:[1,2,4,7,8,9,10,12,17,22,23,29,31,33,46,48,51,52,58,59,60,76,84,91,93,95,98,102],fit:[5,8,63],fix:[0,2,3,10,12,18,27,43,46,49,58,62,66,76,81,84,89],flag:[1,2,12,23,49,66],flatten:[0,3],flavor:[1,9],flavour:2,floor:[68,102],fname:[2,73,74,103],fold:[2,13,97],follow:[1,2,5,6,7,9,12,13,19,22,26,29,30,31,33,45,47,49,55,59,63,69,83,85,86,90,93,95,97,99,101,102],font:101,food:60,forc:[1,2,64],form:[5,6,9,12,16,23,24,36,40,42,49,55,57,60,64,76,83,87,97,99],formal:[97,101],format:[0,2,3,8,9,12,13,30,91,97],formatpars:[23,26],formatt:24,found:[29,40,44,46,58],four:5,fox:76,fraction:[21,23],fragment:12,frame:[2,22,30,31,67,72,91],free:12,freeli:9,french:[6,30,64],frequent:[2,30],friedl:12,friend:15,friendli:[2,5,33,39,87,88],from:[0,1,2,3,4,5,9,12,13,17,21,23,29,30,37,43,44,46,51,58,66,67,69,71,76,79,81,83,84,88,89,91,95,97],from_last:[2,29],fromlast:[2,29],front:87,full:[2,23,65,81,82,93,95,101],fulli:[0,31,60],fundament:6,further:[5,13],futur:[2,23,63,64,65,66,85,86],gaertner:17,gagolew:[1,2],gagolewski:[0,2,13],gain:2,garbag:2,gather:13,gb18030:30,gcing:2,gcmask:2,gcuacggagcuucggagcuag:94,gener:[0,1,2,3,4,7,8,12,13,18,23,27,32,39,40,42,44,46,53,61,70,80,84,87,88,93,96,97,98,101],general_categori:9,generic_loc:90,generic_long:90,generic_short:90,german:
[6,30,93],get:[0,1,2,3,4,5,6,33,45,51,52,53,55,58,59,64,75,85,95,98,102],getlocal:[5,38,39],getopt:[68,102],ggg:23,gggg:23,ggggg:23,ghi:27,github:[0,1,2,9,13,26,63,64,66,91,92],give:[0,2,5,11,12,13,23,29,37,38,49,57,58,59,60,67,68,70,71,77,78,80,81,82,84,85,86,87,88,94,102],given:[0,2,3,4,5,7,12,17,18,23,24,27,32,33,35,36,37,38,39,46,47,49,52,53,54,58,60,66,67,68,69,76,77,81,82,83,84,87,91,94,95,98,99,102,103],glanc:[9,10],glibc:2,gmt:[23,90,91],gmt_long:90,gmt_short:90,good:[12,46],graphem:[5,12],great:4,greater:[5,17,36,38,40,51,52,62,71,102],greatest:31,greatli:0,greedi:[2,102],greek:[9,30,95],greenwich:91,gregorian:[2,20,21,22,23,26,90],gro:[29,95,100],gross:[29,100],group:[0,2,3,5,6,12,30,46,76],gru:23,grudnia:23,guarante:[1,2],guess:[30,31],guid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],guidelin:[23,73,83],had:[2,5],hadlei:0,half:91,halfwidth:95,hand:[81,82],handl:[2,5,6,8,30,38,50,53,62,77,87,95,99],hangul:101,happi:[59,82],hard:63,has:[0,1,2,5,30,38,39,43,48,51,52,53,84,87,92],have:[1,2,5,6,8,9,12,23,29,31,33,39,44,54,63,68,101,102],hbox:2,he_il:26,heap:66,hebrew:[20,21,22,26,30],help:1,hemispher:91,henc:[29,100],here:[9,10,11,12,17,23,30,38,41,43,53,58,60,93],hesit:1,heurist:[30,31],hex:[12,45,95,99],hex_digit:9,hexadecim:9,hhhh:12,hhhhhhhh:12,higher:[30,31],hiragana:63,histor:91,hit:31,hladn:17,hladni:[17,67,72,79,80],hms:23,hold:[17,38],home:[2,13],homepag:[0,13],honour:2,hopefulli:1,horizont:[12,102],host:0,hour12:22,hour:[20,21,22,23,90,91],how:[2,4,5,6,7,9,10,12,13,17,55,67,72,79,80],howev:[1,2,5,6,9,14,30,35,36,44,54,55,62,76,95],html:[5,6,9,10,12,13,26,30,63,64,66,83,91,92],http:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,86,91,92,93,95,96,97,100,101],human:[6,90],hundr:[5,30,31],hungarian:30,hyphen:[9,101],i18n:[2,13,31],iana:33,ibm420:30,ibm424:30,ibm:[13,33],icecream:60,iconv:44,icu4c:[0,2,9,13,26,63,64,66,91,92],icu52dt:2,icu55:[1,2],icu61:2,icu:[0,1,2,5,6,7,8,9,10,13,17,19,20,23,24,
26,29,30,31,33,37,38,39,44,46,47,49,55,56,59,60,63,64,65,66,67,72,76,79,80,82,90,91,92,93,95,96,97,99,100,102],icudt52b:2,icudt61b:2,icudt61l:2,icudt:[1,2],icudt_dir:1,id456:89,id_:14,id_continu:9,id_start:9,ident:91,identifi:[0,2,3,9,19,20,21,22,23,26,31,33,37,47,55,56,59,90,92,93,95,96,102],ideograph:[9,63],iec:9,ietf:[13,97],ifels:103,iff:31,ignor:[2,5,6,9,10,11,12,17,19,23,25,30,44,47,51,52,59,64,71,81,87,91,94,97],ignore_nul:[2,51],ill:[32,40,42,99],imag:30,imbal:2,implement:[2,6,10,11,12,44,69,73,84,86,93],impli:36,implicit:[5,9,38],imprecis:[5,30,31],improp:6,improv:2,inc:13,incident:5,includ:[0,1,2,3,6,7,8,9,12,13,18,26,27,46,58,60,62,76,81,84,86,87,89,101],inclus:[9,87],incompat:2,inconsist:24,incorrect:[2,43,44,53],incorrectli:2,increas:79,increment:64,inde:36,indent:[2,102],independ:[2,7,13,15,17,34,35,36,76],index:[2,29,58,59,84,87,88],indian:26,indic:[2,7,15,17,29,31,34,36,44,46,47,49,58,59,60,82,87,88,100],individu:[2,6,13,42,46,81],influenti:1,info:[12,91],inform:[2,5,6,10,12,13,17,19,33,37,47,49,55,56,57,59,67,72,79,80,82,90,91,92],initi:[2,5,6,9,31,102],inject:87,input:[2,5,11,12,17,30,32,38,40,44,45,51,59,63,64,66,67,73,76,79,81,83,87,88,93,94,95,97,102],ins:73,insensit:[0,3,5,9,12,17,65,66],insert:2,insid:[12,23,66],insight:55,inspect:27,inspir:[0,12,31],instal:[0,2],instanc:[4,5,18,23,27,36,37,46,58,60,84,87,98],instead:[2,62,68,102],instruct:2,integ:[4,5,17,18,19,20,21,27,28,29,32,42,53,54,58,59,62,64,66,67,68,69,71,81,82,84,85,86,87,88,101,102],intellig:2,intens:2,interact:6,interchang:[91,97],interest:[4,13,27,84,89],interestingli:10,interfer:30,intern:[2,5,13,30,32,39,44,49,62,92],internation:13,internet:1,interoper:[5,97],interpret:[5,23,40,43],intersect:9,introduc:[2,97],introduct:[0,12],inttoutf8:32,intuit:[5,38,67,79],invalid:[2,43],invis:[39,57,92],ipa:0,ipsum:[0,2,3,18,52,76,81,85,86,87,102],is_unknown_8bit:[5,43],isalnum:9,ish:2,islam:[6,26],ismwx:12,iso8601:23,iso:[5,6,9,13,23,30,91],ispunct:9,issu:[1,2,4,13,42,44],italian:30,iter:[2,
4,8,9,19,47,59,63,82,93,102],its:[2,4,5,6,9,12,13,15,17,29,37,87,100],itself:[40,91],ja_jp_tradit:26,jamo:101,januari:[20,22],japanes:[8,9,26,30,95],java:[0,10,12,13,33],jdk:12,jkl:27,john:2,join:[14,28,48,51,52],jone:[59,82],joy:13,juli:23,julian:23,jump:76,just:[2,5,6,8,12,19,29,31,41,47,58,59,60,69,76,88,100],kana:63,katakana:[9,63,95],keep:58,kei:[0,2,3,5,64],keyboard:[5,38],keyword:[6,13,20,21,22,23],kile:86,kind:9,know:[4,5,39],knowledg:5,known:[0,2,3,5,31,45,56,66,99],knuth:[2,11,102],koi8:30,korean:[9,30],l10n:13,lacinia:[85,86,102],lai:69,languag:[0,2,3,5,6,7,8,11,13,17,29,31,55,57,64,65,93,95,100,102],language_countri:[6,55,57],language_country_vari:[6,57],lappli:91,larg:9,larger:[2,5],largest:12,last:[2,7,12,29,46,58,59,60,76,83,84,87,94,98,102],latest:1,latex:[0,3],latin1:[2,5,38,44],latin:[9,68,69,71,95,102],lazi:76,lc_ctype:[5,38,39],ldflag:[1,2],lead:[4,5,9,12,17],leak:2,leap:[25,91],least:[4,12,27,30,31,68,71,85],leav:[87,88],led:2,ledkov:2,left:[0,3,9,46,58,64,66,76,102],legal:9,legibl:30,length:[0,2,3,4,9,11,12,29,30,31,38,46,47,48,51,52,53,54,58,59,62,67,68,69,71,76,79,80,81,82,87,88,97,101,102],lenient:[21,23],less:[12,17,54,58],let:5,letter:[6,8,9,10,11,14,18,23,24,30,34,36,48,50,51,53,62,63,64,66,70,71,79,91,93,95,101],level:[2,64],lexicograph:[17,67,72,79],lib64:1,lib:[1,2,49],libc:[2,80],libicu:[1,2],librari:[1,2,17,31,49,98],licens:[0,2,13],ligatur:17,like:[0,1,2,4,5,9,13,14,19,23,31,47,51,58,59,68,76,82,88,93,100,102],limit:[30,66],line:[0,1,2,3,8,9,12,13,19,30,59,63,66,68,74,82,85,86,102],line_break:[8,19,47,59,63,82],linesnempti:85,linguist:[8,9],link:[1,2,9,13],linker:1,linux:[2,5],lipca:23,list:[0,1,2,3,4,5,6,8,9,12,13,16,17,18,19,27,29,30,31,32,33,34,35,36,39,42,44,46,47,49,55,58,59,60,67,72,76,79,80,81,82,83,84,88,89,90,93,95,100,101,102],liter:[12,23,66,76],littl:1,lll:23,llll:23,lllll:23,load:[2,5,30,85,86],local:[0,2,3,7,8,9,12,13,15,17,19,20,21,22,23,26,29,46,47,49,58,59,63,64,67,72,79,80,82,90,91,93,100,102],locale_manag:[6,55,56
,57],locale_sensit:[6,8,10,15,17,19,29,31,47,59,64,67,72,79,80,82,93,100,102],localiz:[0,2,3],locat:[0,2,3,7,8,10,11,19,23,44,47,82],locate_first:58,locate_last:58,log:[67,79],logic:[4,15,17,21,23,27,29,30,34,35,36,37,43,44,46,47,48,49,50,51,54,58,59,60,63,64,65,66,67,68,69,76,79,81,82,83,84,87,88,89,97,102],london:90,longer:[2,36,73,94],longest:[51,54],look:[2,12,14,15,17,30,81,84],lookahead:58,lookup:12,loos:12,lorem:[0,2,3,18,52,76,81,85,86,87,102],los_angel:23,lower:[13,64,93,95],lowercas:[9,95],lukaszdaniel:2,lunar:23,lunch:60,machin:[1,5,39],macro:2,made:2,magrittr:[2,87,88],mai:[1,2,4,5,6,7,8,9,11,12,17,19,20,21,22,23,24,30,33,35,38,39,40,42,43,44,53,54,55,56,57,58,59,62,63,66,68,70,71,76,77,78,81,82,84,85,86,87,93,96,97,98,102],main:30,mainli:95,major:5,make:[1,2,5,8,84,97],makeconf:1,makevar:2,malform:[2,9,55],malici:2,man:[4,7,9,13,45],manag:[1,2,13],mandatori:63,mani:[0,2,6,7,9,12,13,55,57,92,97,98,102],manipul:[5,13],manual:[0,1,2,4,5,12,13,24],map:[0,2,3,5,6,13,40,43,55,65],marek:[0,13],margin:8,mario:17,mark:[2,5,8,9,12,27,30,32,34,35,36,38,40,41,43,44,62,73,80,87,97],marker:[23,44,73],markov:69,markup:30,mask:99,master:[1,12],match:[0,2,3,6,7,8,9,10,12,13,30,31,38,39,46,47,58,59,65,66,76,83,98],matcher:[0,3,4],math:9,mathemat:[9,95],matric:[2,58,59,60,87,88],matrix:[0,3,46,47,58,59,60,81,82,87],max:33,max_count:[2,27],maxim:[33,44,66,73,81,82,102],maximum:1,mean:[9,23,35,36,57,66,85,91,92],meaning:5,mechan:[5,38],medial:101,medium:23,memcheck:2,memori:[2,5,62,74],mention:[19,59,64,82],mere:46,merg:[2,30,46,58,76],messag:[2,12],met:1,meta:84,metacharact:66,method:[53,92,102],mgk25:101,microsystem:2,middl:[8,9,87],might:[9,11,17,19,23,27,30,37,44,87,91],migrat:[9,65],mileston:2,millisecond:[20,22,23,66],mime:33,mimic:2,min:[33,72],mind:[5,58],minim:[2,33,54,68,102],minu:5,minut:[20,21,22,23],mirror:[1,2],misalign:2,mislead:[5,53],miss:[0,2,3,27,29,38,40,42,43,44,46,47,48,50,51,53,58,59,60,61,62,64,66,67,72,75,79,81,85,87,88,89],mmm:23,mmmm:23,mmmmm:23,m
ode:[46,58,60,66,73,74,76,102,103],model:[69,97],modifi:[6,9,20,23,57,86,89],mondai:23,mono:101,monster:93,month:[20,21,22,23,26],more:[0,1,2,4,5,6,8,9,10,12,13,17,18,19,23,24,27,30,31,33,37,43,44,46,47,48,56,57,58,59,60,64,67,72,73,76,79,80,81,82,84,89,90,92,93,97,98,102],moreov:[0,1,2,5,9,19,24,27,38,51,53,54,58,76,83,99,102],morri:[2,11],most:[0,1,2,4,5,9,23,24,26,30,35,36,64,66,97,98,102],mostli:30,move:[2,64],much:[2,10,17,29,73,95,100],multi:[5,9,30],multi_lin:66,multilin:66,multipl:[0,2,3,23,67,68,87,102],multitud:0,must:[6,8,12,76,88],mutual:[87,88],n_max:2,n_min:[2,54,81,82],n_paragraph:[2,69],na_character_:[2,32,54,60,91],na_empti:[2,48,75],na_integer_:91,na_last:[2,67,79],name:[1,2,4,5,9,12,17,18,19,20,21,22,23,26,27,29,30,31,33,37,39,44,46,47,55,57,58,59,60,63,64,65,66,67,72,73,74,76,79,80,81,82,84,85,86,89,90,91,93,95,100,103],narrow:26,nativ:[0,2,3,5,9,13,38,39,43,44,49,62,97],natur:[2,5,7,11,13,17,29,64,100,102],nchar:[2,101],necessari:[1,4,15,18,27,46,58,60,71,76,81,84,89],necessarili:6,need:[2,4,5,12,30,62,87,88,91,98],neg:[12,27,29,81,82,84,87,102],negat:[2,9,27,84,89],neither:[39,43],nel:83,network:97,never:[81,83],new_substr:87,newer:1,newlin:[12,73,83,103],next:83,nfc:[87,97,101],nfd:[64,95,97],nfkc:97,nfkc_casefold:97,nfkd:[95,97],nibh:[85,86,102],nice:2,nie:95,nil:2,nisan:21,nix:2,non:[2,4,5,9,10,12,17,19,20,21,22,23,27,29,45,47,59,64,67,70,71,78,79,82,85,87,99,100,102],noncharacter_code_point:9,nondecreas:[67,79],none:[2,85,102],nonincreas:[67,79],nor:[39,43],norm:97,normal:[0,2,3,5,9,13,17,37,53,62,64,69,70,71,78,87,95,98,100,101,102],normalis:[0,2,64,102],northern:91,norwegian:30,note:[1,2,5,8,9,10,11,12,13,14,17,18,19,20,22,23,30,32,35,36,39,40,41,43,44,46,47,51,53,56,57,58,59,60,63,66,68,76,78,81,82,84,87,91,93,95,97,98,99,101,102],noteworthi:103,noth:[23,103],notion:[10,17,101],now:[1,2],nparagraph:[2,69],npattern:76,nth:12,nul:[44,62],number100:64,number2:64,number:[0,1,2,3,5,6,7,9,12,13,20,22,23,25,27,28,31,33,46,54,63,68,69,71,76,81,8
2,85,86,93,94,101,102],numer:[2,4,5,9,21,23,30,31,64,67,72,79,91,102],numeric_valu:9,object:[0,2,3,14,15,17,19,20,22,23,25,32,38,42,46,47,50,51,53,59,62,63,64,65,66,73,74,77,81,82,87,89,101,103],observ:[2,5,6,43,71,72,91],obtain:[0,2,5,9,30,31,55,85,86,91],occur:[7,8,12,30,44],occurr:[0,2,3,7,18,27,31,44],octal:[12,99],off:1,offset:[90,91],often:[0,10,30,35,62,69,95,97,98],ogonek:[5,36,78,97],old:39,older:1,oldloc:57,oldrel:2,oldtz:92,omit:[1,48,63,83],omit_empti:[2,48,81,83],omit_na:[2,87,88,89],omit_no_match:[2,46,47,52,58,59,60,88],onc:[4,27,74],one:[1,2,4,5,6,8,9,12,18,20,23,26,27,32,33,38,42,44,46,48,53,54,55,58,59,60,62,63,64,68,71,76,85,88,89,90,91,93,95,97,103],ones:[33,64,99],onli:[2,4,5,9,12,30,33,38,39,46,48,51,52,58,59,60,63,66,68,76,80,81,82,83,87,88,89,91,93,98,102],ooo:[12,99],oooo:23,open:[0,2,9,73,74,103],opensus:[1,2],oper:[0,1,2,3,4,5,7,8,9,13,14,15,17,21,29,30,32,42,57,62,66,68,70,71,78,87,88,92,95,100,102],operator_add:[0,3],operator_compar:[0,3],operator_dollar:[0,3],opposit:64,optim:5,option:[1,2,6,15,17,29,30,43,51,52,67,72,79,80,100],opts_brkit:[2,19,47,59,82,93],opts_col:[2,17,18,27,29,46,58,64,67,72,76,79,80,81,84,89,100],opts_fix:[2,18,27,46,58,65,76,81,84,89],opts_regex:[2,18,27,46,58,60,66,76,81,89],oracl:2,order:[0,2,3,5,6,9,13,17,27,30,31,43,44,64,70,72,73,78,79,80,87,97],ordinari:[51,64],org:[1,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,91,92,93,95,96,97,98,100,101],orient:86,origin:[2,80,86],other:[0,2,4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],otherwis:[4,23,27,29,44,45,46,47,49,51,52,54,66,71,81,82,85,90,91,102],our:[1,2,4,5,98],out:[1,2,5,9,46,50,68,69,87,98],output:[2,5,23,42,43,44,47,53,67,68,70,71,73,74,78,79,80,89,97,103],outsid:[12,23],over:[2,5,14,15,16,17,18,
19,20,21,22,23,27,28,30,31,46,47,51,58,59,60,68,71,76,81,82,83,84,87,88,89,93,94,98,102],overal:[5,12],overflow:2,overful:2,overlap:[2,9,46,58,60,65,76],overload:16,overrid:1,overwhelm:1,own:44,pace:13,pacif:23,packag:[1,2,5,9,47,57,68,92],pad:[0,2,3,13],page:[2,4,5,7,13,24,45],pair:9,pairwis:15,paper:[0,2,10],paragraph:[0,2,3,8,9,69,83],paramet:[2,10,83,87,88],parametr:6,parenthes:[12,60,76],pars:[0,2,3,13],part:[1,2,9,38,39,76,87,88],particular:[1,4,5,6,8,9,13,63,87,95],pass:[0,1,2,3,16,18,27,46,55,58,59,60,63,64,65,66,76,81,84,87,88,89],password:71,past:[2,48,51,77],pat1:9,pat2:9,pat:[58,84],patch:2,path:1,patter:2,pattern:[0,2,3,4,7,10,12,13,23,30,66,71,94,98],pdf:2,pdt:23,peculiar:[4,70,71,78],pellentesqu:[85,102],per:[4,6,57,69,102],perform:[0,2,3,4,5,6,7,9,10,11,12,15,17,19,29,47,56,57,59,62,63,64,66,67,74,79,82,95],perl:[9,12],permiss:64,permut:[0,2,3,70,78],persian:26,phonebook:[6,17],php:86,piec:[9,10,19,81,82],pipabl:2,pipe:[2,87,88],pizza:60,pkg:[1,2],pkg_config:[1,2],pkg_config_path:1,pl_fonipa:95,pl_pl:[17,23,26,55,67,72,79,80],place:[9,87,88,89],plai:[5,88],plain:77,plass:102,platform:[1,2,5,6,13,38,83,92,103],pleas:[1,4,5,9,10,17,24,44,60,63,98],plu:[5,9,12],point:[0,2,3,5,8,9,12,13,15,17,19,31,32,33,40,42,44,59,62,64,65,68,71,78,84,85,87,91,93,94,100,102],polish:[5,6,17,30],poor:2,poorli:66,portabl:[0,1,2,5,9,44,72],portion:12,portugues:30,posit:[2,5,8,9,12,35,36,58,59,63,64,81,82,84,87,102],posix:[2,65],posix_alnum:9,posix_blank:9,posix_graph:9,posix_print:9,posix_xdigit:9,posixct:[20,21,22,23,25],posixst:23,possess:12,possibl:[0,1,2,3,4,5,12,31,38,63,65,81,82,84,97,102],potenti:97,power:[0,12,13],pqrst:28,practic:102,pratt:[2,11],pre:[2,95],preced:[9,12],precis:[5,6,66,91],predefin:[9,69],predict:13,prefer:12,prefix:[2,102],prepar:2,preprocessor:1,preserv:[2,98,102],prevent:[2,63],previou:[12,57,92],previous:[2,39,57,92],primari:64,print:[2,5,8,9,20,53,68,87,88,89,101,102],printabl:45,prioriti:87,privat:9,probabl:71,problem:[1,2,97],problemat:44,p
roce:101,process:[2,3,5,7,8,9,10,11,17,29,30,45,47,62,66,68,69,81,92,95,97,98,100,102],produc:[23,44,65],prof:[59,82],program:[5,6,102],proin:[86,102],project:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,98,100],pronounc:0,propag:1,proper:36,properli:[1,5,6,10,38,50,53,62],properti:[4,7,12,18,85,98,101],protect:2,protocol:5,provid:[2,5,6,9,10,11,12,13,16,17,31,33,47,49,51,55,60,64,87,90,91,94,95,102],pseudo:[2,13,69,70,71],pt_br:57,punct:9,punctuat:[8,9,10,11,23],purpos:[2,5,8,83],put:[67,79,97,102],python:16,qqq:23,qqqq:23,qqqqq:23,quarter:[23,26],quaternari:64,queri:[0,3,6,56,92],quick:76,quicker:76,quit:[0,5,12,66],quot:[9,12,23,45],quotat:9,quotation_mark:9,r_home:1,r_inst_dir:1,r_usedynamicsymbol:2,ragged:[2,102],rais:[2,33],random:[0,2,3,9,13,69,70,78],randomli:[0,3,69],rang:[0,5,9,12,23,87,88,95],rank:[0,2,3,13,80],ranki:95,rare:[2,4,5],rather:[27,44,66,68,84,89,97,102],raw:[0,3,5,30,31,34,35,36,42,44,90,91],rawoffset:90,rawtochar:[30,44],rbbi:63,rbind:91,rbuildignor:1,rchk:2,rcpp:[0,2],read:[0,2,3,5,13,38,41],readabl:90,readbin:30,readlin:[30,73,85,86],real:23,realli:[5,55],rearrang:67,reason:[2,4,5,43,44],recal:9,receiv:72,recent:1,recogn:[6,45,66,99],recommend:[97,102],recycl:[2,4,15,18,27,46,58,60,71,76,81,84,88,89],redund:71,refer:[0,1,2,18,24,27,46,58,60,76,81,84,89],referenc:6,reflect:[6,33],reformat:102,regard:[2,29,67],regardless:5,regex:[0,2,3,4,7,9,18,27,46,58,76,81,84,89],regexmatch:2,regexp:[9,12,66],region:[6,91],regular:[0,3,4,5,7,9,13,66,83,98],reilli:12,rel:[1,23,80],relat:[13,15,17,23],relationship:64,releas:[0,1,2,85,86],relev:1,reli:[1,2,5,84,98],reliabl:64,remaind:[81,82],rememb:4,remov:[0,2,3,5,9,17,30,37,43,63,64,65,66,67,76,79,81,83,95,97,98,100],renam:2,rep:70,replac:[0,2,3,7,13,20,23,24,40,43,44,71,72,81,89,94,98,102],repo:1,report:[1,2,9,12,19,66,83,97,101],repres:[5,9,17,23,25,30,32,33,36,37,46,58,60,66,83,85,86,91],represent:[2,5,21,33,80,90,92],request:[5,6,24,56],requir:[1,2,11,12,23,63],rese
rv:[9,23],resolv:1,resourc:[6,56],respect:[2,4,9,12,18,23,27,46,47,58,59,72,76,81,82,84,87,88,89,94],rest:93,restor:[57,92],restrict:95,result:[2,4,5,6,9,11,12,13,14,15,17,18,19,23,27,28,29,35,36,37,41,43,46,47,49,51,52,54,55,58,60,64,65,69,70,71,72,76,78,79,80,81,82,83,84,88,89,93,99],retri:12,reus:4,revers:[0,3,13,33,68,70],revert:2,rexamin:76,rf_error:2,rfc3629:13,rfc5198:97,rfc:[13,23,97],rid:[2,75],right:[0,3,9,46,58,76],robust:73,role:[5,88],romanian:30,roughli:[31,42,77,89,101],round:[2,60,76],routin:[2,5],row:[23,46,47,54,58,59,60,81,82],rpm:1,rule:[2,4,19,47,59,63,64,83,88,91,97],run:[2,30,46,57,62,76,84,87,92],runif:72,russian:30,sake:23,same:[2,5,6,9,13,17,29,33,38,39,50,53,54,55,57,62,64,72,80,81,91,97,100,101],sampl:[71,79],saniti:2,sappli:[69,90],sausag:52,save:[90,91],scelerisqu:[85,86,102],scenario:[46,58,60,88],scharf:93,schedul:2,scheme:[5,9,33],scp:1,screen:68,script:[1,2,9,68,71,95,102],search:[0,1,2,3,4,5,6,9,11,12,13,18,19,27,29,46,47,58,59,60,63,64,66,71,76,81,82,84,85,89,98,101],search_charclass:[7,9,98],search_col:[7,10,64],search_count:[7,18,19],search_detect:[7,27,84],search_extract:[7,46,47,60],search_fix:[7,11,65],search_loc:[7,58,59],search_regex:[7,12,66],search_replac:[7,76,98],search_split:[7,81,82,83],search_subset:[7,89],second:[2,17,20,21,22,23,25,58,59,60,91],secondari:64,section:[6,9,12,66],sed:[1,85,86,102],see:[0,1,2,16,68,78],seek:13,seem:10,seen:[2,38],segfault:2,select:[0,3,5,6,22,31,33,69,102],selector:26,semant:5,sens:5,sensit:[0,3,7,13,23,57,65,66,93],sentenc:[8,19,59,63,69,82,93],sep:[2,14,23,48,51,52,68,69,77,102,103],separ:[8,9,23,47,48,51,52,55,58,63,73,81,83,84,85,86,95,103],septemb:23,sequenc:[0,1,2,3,5,11,12,23,30,32,34,36,40,42,43,44,53,58,66,83,95,97,102],seri:[9,95],serv:[44,83],server:[1,2],servic:[2,5,6,10,56,64,91,95],session:1,set:[0,1,2,3,4,5,6,9,11,12,17,18,19,20,21,22,23,27,29,32,42,43,44,46,47,51,53,58,59,60,67,69,71,72,76,79,80,81,82,83,84,89,93,100],setdatadirectori:2,setup:1,sever:[6,30],shall:2,shap
e:9,shift_ji:30,ship:[1,2],shorter:[15,18,27,46,58,60,76,81,84,89],should:[1,2,5,6,21,23,29,30,38,39,44,48,49,54,58,63,65,67,68,69,75,76,79,81,83,89,98,101,102],show:30,shown:[5,9,12],shuffl:[0,3],side:[0,3,68,102],sign:[2,5,9,20,25],signific:[2,6,23],significantli:[29,100],silent:[2,4,5,17,43,51,52,87],similar:[2,5,6,9,12,16,43,54,55,91],simpl:[2,5,38,65,69,102],simplest:88,simpli:[1,2],simplifi:[2,30,37,46,47,69,81,82,102],simplify2arrai:54,sinc:[0,9,12,25,46,76,91],singl:[2,5,8,9,16,19,20,21,22,23,26,27,29,30,31,32,33,37,39,40,43,44,46,47,48,49,51,52,54,55,57,58,59,60,63,64,65,67,68,69,71,73,76,77,79,80,81,82,83,84,87,88,89,90,91,92,93,94,95,98,102],singleton:27,sit:[18,52,69,76,81,85,86,87,102],site:[1,2,13,91],situat:39,six:12,size:[33,44,66,73],sk_sk:[17,46,58,67,72,79,80,90],skip:[46,58,76],skip_:63,skip_line_hard:63,skip_line_soft:63,skip_sentence_sep:[63,82],skip_sentence_term:63,skip_word_ideo:63,skip_word_kana:63,skip_word_lett:[63,82],skip_word_non:[19,59,63,82],skip_word_numb:[63,82],slash:9,slightli:[84,86],slovak:17,slow:76,slower:[10,14,29,100],small:[5,71,86,93,95],smaller:88,smith:[59,82],snprintf:2,soft:[9,63,101],soft_dot:9,softwar:102,solari:[1,2,39],sole:[2,5],solut:1,solv:2,some:[1,2,4,5,9,11,12,13,23,24,30,33,37,44,48,55,56,57,58,63,66,86,87,90,99],somehow:5,someth:[9,76],sometim:[4,35,53,83],somewhat:[12,67,79],sort:[0,2,3,5,6,13,37,64,67,88],sourc:[0,1,2,69],sourceforg:86,southern:91,space:[2,5,8,9,12,18,23,46,58,66,76,85,86,98,101,102],space_separ:12,spaghetti:60,spam:[19,52,59,82],sparc:1,speak:5,special:[5,9,45,63,66],specif:[2,6,8,9,10,11,13,17,20,23,31,56,84,91,97],specifi:[2,5,6,9,12,20,21,22,23,24,37,44,63,71,76,95,97,98,102],spectrum:5,speed:[2,5,66],spell:2,split:[0,2,3,7,12,13,73,74,102],spontan:2,sprintf:[0,2,3],squar:[9,102],src:[1,2],sse2:2,sss:23,ssss:23,ssz:23,stabl:[67,79],stable_sort:[67,79],stack:[2,66],stack_limit:[2,66],stage:2,stand:[6,9,22,23,26],standalon:26,standard:[0,1,2,5,6,9,12,33,59,62,82,83,97,99,101],start:[0,
2,3,7,8,9,27,46,58,59,66,68,69,76,87,88,98,102],start_lipsum:69,stat:[85,86],state:[2,9,20,68,90,102],statist:[0,3,5,13,30,31],statu:[2,19,47,59],stdin:[5,38],step:95,stick:98,still:[1,6],sting:27,stl:[67,79],stop:[2,27,66],storag:[5,66],store:[5,62],str2:77,str:[2,11,18,19,23,27,28,29,30,31,34,35,36,38,40,41,42,43,44,45,46,47,48,50,53,58,59,60,62,67,68,70,72,76,77,78,79,80,81,82,83,84,85,86,87,88,89,93,94,95,97,98,99,100,101,102,103],str_split_fix:2,strchr:2,strcmp:[17,80],stream:[0,3,40,43],strength:[17,29,46,58,64,84,100],strftime:[23,24],stri:[2,14,15,16,28],stri_:[2,4,7,9,10,12,65,84],stri_brkit:2,stri_c:[2,51],stri_c_list:52,stri_cmp:[2,13,17,64],stri_cmp_eq:[2,17,93],stri_cmp_equiv:[2,15,17],stri_cmp_g:[2,17],stri_cmp_gt:[2,17],stri_cmp_l:[2,15,17],stri_cmp_lt:[2,17],stri_cmp_neq:[2,17],stri_cmp_nequiv:[2,17],stri_col:64,stri_compar:[0,3,6,8,10,15,19,29,31,47,59,64,67,72,79,80,82,93,100,102],stri_conv:44,stri_count:[0,2,3,7,19],stri_count_:7,stri_count_boundari:[0,2,3,6,7,8,10,13,15,17,18,29,31,47,53,59,63,64,67,72,79,80,82,83,93,100,102],stri_count_charclass:18,stri_count_col:18,stri_count_fix:[2,18,65],stri_count_regex:[18,66],stri_count_word:[2,19,47,59],stri_datetime_add:[0,2,3,21,22,23,24,25,26,90,91,92],stri_datetime_cr:[0,2,3,20,22,23,24,25,26,90,91,92],stri_datetime_field:[0,2,3,20,21,23,24,25,26,90,91,92],stri_datetime_format:[0,2,3,13,20,21,22,24,25,26,90,91,92],stri_datetime_fstr:[0,2,3,20,21,22,23,25,26,90,91,92],stri_datetime_now:[0,2,3,20,21,22,23,24,26,90,91,92],stri_datetime_pars:[2,23,24],stri_datetime_symbol:[0,2,3,20,21,22,23,24,25,90,91,92],stri_detect:[0,2,3,7,84,89],stri_detect_:[2,7],stri_detect_charclass:27,stri_detect_col:[27,64],stri_detect_fix:[27,65],stri_detect_regex:[2,27,66,84],stri_dup:[0,2,3,13,14,48,51,52],stri_dupl:[0,2,3,6,8,10,13,15,17,19,31,47,59,64,67,72,79,80,82,93,100,102],stri_duplicated_ani:[2,29],stri_enc_detect2:[0,2,3,5,6,8,10,15,17,19,29,30,34,35,36,47,59,64,67,72,79,80,82,93,100,102],stri_enc_detect:[0,2,3,5,31,
34,35,36,74],stri_enc_fromutf32:[0,3,5,40,41,42,43,44,46,101],stri_enc_get:[5,38,39,41,43,44],stri_enc_info:[0,3,5,37,38,39,49],stri_enc_isascii:[0,2,3,5,30,31,35,36],stri_enc_isnf:2,stri_enc_isutf16:[0,3],stri_enc_isutf16b:[5,30,31,34,35,36],stri_enc_isutf16l:35,stri_enc_isutf32b:35,stri_enc_isutf32l:35,stri_enc_isutf8:[0,2,3,5,30,31,34,35],stri_enc_list:[0,3,5,33,38,39,44],stri_enc_mark:[0,2,3,5,33,37,39,40,41,43,44],stri_enc_nf:2,stri_enc_set:[0,2,3,5,33,37,38],stri_enc_toascii:[0,3,5,32,41,42,43,44],stri_enc_ton:[0,2,3,5,32,40,42,43,44],stri_enc_toutf32:[0,3,5,32,40,41,43,44],stri_enc_toutf8:[0,2,3,5,32,40,41,42,44,53,77],stri_encod:[0,2,3,5,30,32,40,41,42,43,73,74],stri_endswith:[2,27,84],stri_endswith_:[2,7],stri_endswith_charclass:84,stri_endswith_col:84,stri_endswith_fix:84,stri_escape_unicod:[0,3,13,62,99],stri_extract:[0,2,3,7,58,60],stri_extract_:[2,7,46,47],stri_extract_al:[2,7,46,47,54,60,88],stri_extract_all_:[2,46,47],stri_extract_all_boundari:[6,7,8,10,15,17,19,29,31,46,47,59,60,63,64,67,72,79,80,82,83,93,100,102],stri_extract_all_charclass:[2,46],stri_extract_all_col:46,stri_extract_all_fix:[2,46,65],stri_extract_all_regex:[2,46,52,60],stri_extract_all_word:[2,8,12,19,47,52,59],stri_extract_boundari:[0,3],stri_extract_first:[46,87],stri_extract_first_:[46,47],stri_extract_first_boundari:47,stri_extract_first_charclass:46,stri_extract_first_col:46,stri_extract_first_fix:46,stri_extract_first_regex:46,stri_extract_first_word:[2,47],stri_extract_last:[46,87],stri_extract_last_:[46,47],stri_extract_last_boundari:47,stri_extract_last_charclass:46,stri_extract_last_col:46,stri_extract_last_fix:46,stri_extract_last_regex:46,stri_extract_last_word:[2,47],stri_extract_word:2,stri_flatten:[0,2,3,13,14,28,30,51,52,69],stri_info:[0,2,3,39],stri_install_check:2,stri_install_icudt:2,stri_isempti:[0,3,53,62,101],stri_join:[0,2,3,4,13,14,28,48,52],stri_join_list:[0,2,3,14,28,48,51],stri_length:[0,2,3,13,19,50,62,94,101],stri_list2matrix:[0,2,3,46,47,61,75,77,81,82]
,stri_loc:[0,2,3,7],stri_locale_get:57,stri_locale_info:[0,3,6,49,56,57],stri_locale_list:[0,3,6,55,57],stri_locale_set:[0,3,6,55,56],stri_locate_:[7,58,59],stri_locate_al:[7,58,59,87,88],stri_locate_all_:[2,58,59],stri_locate_all_boundari:[2,6,7,8,10,15,17,19,29,31,47,58,59,63,64,67,72,79,80,82,83,87,88,93,100,102],stri_locate_all_charclass:[2,58],stri_locate_all_col:58,stri_locate_all_fix:[2,58,65],stri_locate_all_regex:[44,58,88],stri_locate_all_word:[2,19,59],stri_locate_boundari:[0,2,3],stri_locate_first:[58,87,88],stri_locate_first_:[58,59],stri_locate_first_boundari:[2,59],stri_locate_first_charclass:58,stri_locate_first_col:58,stri_locate_first_fix:58,stri_locate_first_regex:[58,87],stri_locate_first_word:[2,59],stri_locate_last:[58,87,88],stri_locate_last_:[58,59],stri_locate_last_boundari:[2,59],stri_locate_last_charclass:58,stri_locate_last_col:58,stri_locate_last_fix:58,stri_locate_last_regex:[58,87],stri_locate_last_word:[2,59],stri_locate_regex:2,stri_locate_word:2,stri_match:[0,2,3,7,12,46],stri_match_:[2,60],stri_match_al:[7,46,47,60],stri_match_all_:[2,60],stri_match_all_regex:60,stri_match_first:60,stri_match_first_regex:60,stri_match_last:60,stri_match_last_regex:60,stri_na2empti:[0,2,3,54,75,77],stri_numbyt:[0,3,19,50,53,101],stri_omit_empti:[2,75],stri_omit_empty_na:[2,75],stri_omit_na:[2,75],stri_opts_brkit:[0,2,3,7,8,19,47,59,82,83,93,102],stri_opts_col:[0,2,3,6,7,8,10,13,15,17,18,19,27,29,31,46,47,58,59,67,72,76,79,80,81,82,84,89,93,100,102],stri_opts_fix:[0,2,3,7,11,18,27,46,58,76,81,84,89],stri_opts_regex:[0,2,3,7,12,18,27,46,58,60,76,81,89],stri_ord:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,72,79,80,82,93,100,102],stri_pad:[0,2,3,13,102],stri_pad_:[2,68],stri_pad_both:[2,68],stri_pad_left:[2,68],stri_pad_right:[2,68],stri_past:[2,51,58,70,71,77,84,102],stri_paste_list:52,stri_prepare_arg_posixct:2,stri_rand_lipsum:[0,2,3,13,70,71],stri_rand_shuffl:[0,2,3,13,69,71,78],stri_rand_str:[0,2,3,9,13,69,70],stri_rank:[0,2,3,6,8,10,13,15,17,19,29,31
,47,59,64,67,79,80,82,93,100,102],stri_read_bin:2,stri_read_lin:[0,2,3,13,74,85,103],stri_read_raw:[0,2,3,13,73,103],stri_remove_empti:[0,2,3,54,61,77],stri_remove_empty_na:[2,75],stri_remove_na:[2,75],stri_replac:[0,3,7,98],stri_replace_:[7,76],stri_replace_al:[2,7,76,98],stri_replace_all_:[2,76],stri_replace_all_charclass:[2,76],stri_replace_all_col:76,stri_replace_all_fix:[2,76],stri_replace_all_regex:76,stri_replace_first:[76,87],stri_replace_first_charclass:76,stri_replace_first_col:76,stri_replace_first_fix:76,stri_replace_first_regex:76,stri_replace_last:[76,87],stri_replace_last_charclass:76,stri_replace_last_col:76,stri_replace_last_fix:76,stri_replace_last_regex:76,stri_replace_na:[0,2,3,54,61,75],stri_revers:[0,3,13,70],stri_sort:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,72,80,82,93,100,102],stri_sort_kei:[0,2,3,6,8,10,15,17,19,29,31,47,59,64,67,72,79,82,93,100,102],stri_split:[0,2,3,7,54,82,83],stri_split_:[2,7],stri_split_boundari:[0,2,3,6,7,8,10,15,17,19,29,31,47,59,63,64,67,72,79,80,81,83,93,100,102],stri_split_charclass:[2,81],stri_split_col:[2,81],stri_split_fix:[2,55,81],stri_split_lin:[0,3,7,8,13,19,47,59,63,81,82,93,102],stri_split_lines1:[73,74,83],stri_split_regex:[2,81],stri_startsendswith:[0,3],stri_startswith:[2,7,27,84],stri_startswith_:[2,7],stri_startswith_charclass:84,stri_startswith_col:84,stri_startswith_fix:84,stri_stats_gener:[0,3,13,86],stri_stats_latex:[0,3,13,85],stri_sub:[0,2,3,13,58,59,88],stri_sub_al:[0,2,3,58,59,87],stri_sub_all_replac:88,stri_sub_replac:[2,87],stri_sub_replace_al:[2,88],stri_subset:[0,2,3,7,27],stri_subset_:[2,7],stri_subset_charclass:89,stri_subset_col:89,stri_subset_fix:89,stri_subset_regex:89,stri_timezone_get:[2,20,21,22,23,24,25,26,90,91,92],stri_timezone_info:[0,2,3,20,21,22,23,24,25,26,91,92],stri_timezone_list:[0,2,3,20,21,22,23,24,25,26,90,92],stri_timezone_set:[0,2,3],stri_trans_casefold:2,stri_trans_casemap:[0,3],stri_trans_char:[0,2,3,13,93,95,96,97],stri_trans_gener:[0,2,3,13,93,94,96,97],stri_
trans_isnf:[2,97],stri_trans_isnfc:97,stri_trans_isnfd:97,stri_trans_isnfkc:97,stri_trans_isnfkc_casefold:97,stri_trans_isnfkd:97,stri_trans_list:[0,2,3,93,94,95,97],stri_trans_nf:[0,2,3],stri_trans_nfc:[5,13,53,87,93,94,95,96,97,101,102],stri_trans_nfd:[78,95,97],stri_trans_nfkc:97,stri_trans_nfkc_casefold:97,stri_trans_nfkd:[17,19,29,53,68,97,100,101],stri_trans_to:2,stri_trans_tolow:[6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,72,79,80,82,83,93,94,95,96,97,100,102],stri_trans_totitl:[2,8,93],stri_trans_toupp:[93,95],stri_trim:[0,3,7,13,76],stri_trim_both:[7,9,76,98],stri_trim_left:[68,98],stri_trim_right:98,stri_unescape_unicod:[0,3,45],stri_uniqu:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,72,79,80,82,93,102],stri_width:[0,2,3,13,50,53,62,68,102],stri_wrap:[0,2,3,6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,68,69,72,79,80,82,83,93,100],stri_write_lin:[0,2,3,13,73,74],stricontainerutf16:2,stricontainerutf8:2,strictest:64,striexcept:2,string8:2,string:[2,3,4,5,6,9,11,12,16,18,19,20,21,22,23,26,27,29,30,31,32,33,34,35,36,39,40,45,46,47,49,51,53,54,55,57,58,59,60,62,63,64,65,66,67,69,72,73,76,77,79,80,85,86,87,88,89,90,91,92,94,95,97,100,101,102],stringi:[7,13,17,18,19,25,27,32,34,35,36,37,38,44,46,47,51,55,56,58,59,60,63,64,65,66,67,68,71,72,76,79,80,81,82,83,84,85,86,87,89,93,95,97,98,100,101,102],stringi_1:1,stringi_cflag:[1,2],stringi_cppflag:[1,2],stringi_cxxflag:[1,2],stringi_disable_cxx11:[1,2],stringi_disable_icu_bundl:[1,2],stringi_disable_pkg_config:[1,2],stringi_general_top:[4,5,6,7,8,9,10,11,12,13],stringi_ldflag:[1,2],stringi_lib:[1,2],stringr:[0,2],stringsearch:[7,10],strncpy:2,strongli:[1,9],strptime:[0,2,3],strrringi:[18,27],strstr:2,strsxp:2,strwrap:[2,102],stubdata:2,student:2,studio:2,stuff:[85,86],style:[0,3,9,23,30],sub:[12,60,89],sub_index:2,submiss:2,subsequ:102,subset:[1,2,4,5,7,9,27,33],substitut:[2,5,40,44,73,81,87,88,89,102,103],substr:[0,2,3,12,13,46,59,60,64,76,81],success:1,successfulli:1,suffici:2,suggest:[0,1,2,6,102,103],suit:[29,98,100],
suitabl:[1,2,102],summar:[9,12],sun:2,sundai:22,superset:[5,39],supplementari:[18,27,46,58,60,76,81,84,89],suppli:[2,12,30,31,76],support:[0,2,5,6,9,23,24,37,39,44,46,49,60,62,81,90,97],suppos:2,suppress:2,sure:[1,35],surrog:9,surround:93,suscipit:[85,86,102],swedish:30,sxpinfo:2,syllabl:9,symbol:[2,9,23],synonym:28,syntax:[9,12,16,23,63],sys:2,system:[1,2,5,6,8,9,38,39,49],tab:[9,12,83,102],tabl:30,tabul:12,take:[10,17,65,68,90,102],taken:[8,30],tar:1,target:[2,44],tartanu:[0,13],task:[2,7,12,13,95,96],tato:95,team:86,technic:[5,8,12,44,83,97],techniqu:30,technolog:2,tellu:[85,102],temporari:14,term:[51,91],termin:[12,27,63,66],terminal_punctu:9,tertiari:64,test1:77,test2:19,test:[2,6,9,15,17,19,27,29,30,39,59,77,82,84,100],text:[0,2,3,5,7,9,12,13,23,30,31,63,68,69,81,85,86,87,93,97,101],text_boundari:[7,8,19,47,59,63,82,83,93,102],textbf:86,textit:86,textual:9,tf08:5,tgca:94,th_th_tradit:26,than:[2,4,5,8,9,10,12,14,17,23,29,38,40,44,51,52,54,58,62,64,67,70,71,88,100,102],thank:[0,2],thei:[2,5,6,9,12,13,15,17,23,32,43,44,46,58,59,60,63,65,67,76,79,84,89,95],them:[5,6,17,30,33,96],themselv:[66,81],theoret:9,therefor:[5,9,17,83],therein:13,thereof:44,thi:[0,1,2,4,5,6,7,8,9,17,18,19,22,23,27,30,31,32,33,34,36,37,38,40,41,42,43,44,46,50,51,53,54,55,58,59,60,61,62,63,64,65,66,67,68,70,71,72,73,76,77,78,79,80,82,83,84,85,86,91,95,97,100,102,103],think:8,third:[8,60,64],those:[5,6,10],though:[2,12],thought:5,three:[12,23,30,31,91,93],through:9,throughout:91,thu:[4,5,59,81,97,103],tie:9,tied:72,time:[0,2,3,5,9,11,12,13,14,24,28,29,66,81,89,94],time_limit:[2,66],timezon:[20,23,90,91,92],titl:[13,93,95],to_raw:44,todo:2,togeth:[0,1,3,6,49,95],token:[81,82],tokens_onli:[2,81,82],toler:1,too:2,took:4,tool:[2,12,13,97],top:64,topic:[12,13],total:[12,31,68,85,98,102],tr11:101,tr13:83,tr15:97,tr18:[12,83],tr29:66,tr44:9,tr_tr:93,tracker:0,tradit:[30,66],trail:62,transform:[0,2,3,13,94,97],transit:12,translat:[0,3,5,13,33],transliter:[0,2,3,13],transpos:54,transposit:54,treat:[12,
13,23,48,51,64,66,75],treatment:[67,79],tri:[2,5,8,12,31,37,39],trick:1,trim:[0,3,13,84],trivial:2,truncat:[23,69],tue:23,tuesdai:23,tune:[6,10,11,12,17,18,27,46,58,63,64,65,66,67,72,76,79,80,81,84,89],turkish:30,turn:64,tutori:12,tweak:[1,2,11],two:[0,2,3,5,6,9,12,15,17,23,53,58,59,72,83,87,88,91,93,94,97],txt:[9,30,97],type:[1,2,5,8,9,19,44,53,59,63,74,81,82,87,88,93,103],typic:[5,14,15,84,91,97],tzone:22,u0000:9,u0007:12,u0009:12,u000a:12,u000c:12,u000d:12,u0010ffff:[9,12],u001a:44,u001b:12,u0032:99,u00a0abov:[19,59,82],u00a9:19,u00df:[19,29,93,95,100],u00e1rio:17,u00e4rtn:17,u00fd:[17,46,58],u0104123:78,u0104:[34,36,50,53,62,93,95],u0105:[9,17,29,34,36,45,50,53,62,78,93,97,99,100,101],u0119:19,u0153:19,u0222:36,u03c0:19,u0627:[58,84],u0633:[58,84],u0635:[58,84],u0639:[58,84],u0644:[58,84],u0645xyz:[58,84],u0647:[58,84],u0648:[58,84],u0649:[58,84],u064a:[58,84],u105:17,u1234:36,u200c:12,u200d:12,u2190:19,u2192:19,u2193:19,u2620:95,u7fffffff:62,u_charset_is_utf8:[2,39,49],u_ea_fullwidth:101,u_ea_wid:101,u_hst_trailing_jamo:101,u_hst_vowel_jamo:101,u_init:2,u_missing_resource_error:2,u_toupp:65,uax:101,ubbfc:68,ubc1f:101,ubrk:63,ubrk_8h:63,ubrk_word_non:[19,47,59],ubsan:2,ubuntu:[1,2],uc74c:68,uc815:68,ucd:13,uchar32:33,uchar:33,uchar_east_asian_width:101,uchar_hangul_syllable_typ:101,ucs:101,ud6c8:68,ufb00:17,ufdfa:[58,84,97],ufdfaxyz:[58,84],ufffd:[43,44],uhhhh:12,uhhhhhhhh:12,uint32_t:2,umlaut:36,unambigu:83,unassign:9,unavail:[33,56,60],unbound:12,unchang:[43,76,87,88],under:[0,2,5,13],underli:[18,27,46,58,60,76,80,81,84,89],underscor:55,understand:[5,55,99],undesir:39,unfortun:5,unicod:[0,2,3,5,7,8,11,12,13,17,19,26,32,33,42,43,49,53,62,63,64,66,68,70,71,73,78,81,83,85,87,91,92,93,94,95,98,99,100,101,102],unicode_equival:97,unicodeset:[2,95],unicodestr:2,unidata:9,uninspect:27,union:9,uniqu:[0,2,3,6,8,29,37,94],unit:[2,5,8,9,20,93],unitialis:2,univers:[2,5,13,91,98],unix:[2,5,9,66],unix_lin:66,unknown:[2,5,6,30,33,38],unless:[5,9,27,39,51,52,92],unlik:[23,29,3
8,42,58,100],unnecessari:98,unprotect:2,unrecogn:66,unsupport:55,until:12,unzip:1,updat:2,upgrad:2,upon:1,upper:[9,13,64,93,95],uppercas:[9,95],uppercase_first:64,ups:[2,5],uregex_8h:66,uregexpflag:66,usag:[1,2,9],use:[1,2,4,9,10,12,38,42,43,44,48,62,66,81,84,86,89,91,95,97,101],use_length:[68,102],use_width:2,usearch:2,used:[1,2,4,5,6,9,13,17,18,19,23,24,27,30,32,33,38,39,40,43,44,45,46,47,48,49,51,52,53,55,57,58,59,60,62,63,64,65,68,69,73,76,77,81,83,84,87,89,90,91,92,93,94,96,98,102],usedynlib:2,useful:[2,5,7,9,19,54,59,80,82,95],user:[1,2,5,6,8,9,10,12,17,20,23,26,29,30,39,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],userguid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],uses:[2,6,8,9,26,30,31,38,65,66,67,79,90,97],usesdaylighttim:90,using:[2,5,6,9,10,15,23,24,30,31,66,80,92,97,103],uslax:23,usr:1,usual:[11,15,32,45,51,53,67,79,88,89,97,100],utc:[25,91],utf8:[5,37,49],utf8toint:42,utf:[0,2,3,13,17,30,31,33,38,39,40,41,44,49,51,53,62,73,89,97,99,103],utf_8:5,utf_bom:5,util:[6,12,54,61,75,77,92,102],utr22:33,utr:83,uuuu:23,uword:66,uxxxx:[45,99],uxxxxxxxx:[45,99],valgrind:2,valid:[2,5,6,17,31,34,35,36,37,43,99],valu:[0,2,3,5,6,9,12],vari:91,variabl:[1,2,23,64],variant:[6,55,76,87,88],varieti:95,variou:[5,68,102],vec:32,vector:[0,2,3,5,7,13,15,16,17,18,19,20,21,22,23,24,27,28,29,30,31,32,34,35,36,37,38,40,41,42,43,44,45,46,47,48,50,52,53,54,56,58,59,60,61,62,67,68,69,70,71,72,73,74,76,78,79,80,81,82,83,84,88,89,91,93,94,95,96,97,98,99,100,101,102,103],vectorise_al:76,vectorize_al:[2,76],vel:[85,102],veri:[0,1,2,5,9,11,12,19,39,59,69,82,102],verifi:6,versa:23,version:[1,2,20,32,44,49,75,79,87,88,89,99,100],vertic:83,via:[1,2,11,12,30,38,51,65],vice:23,video:0,vietnames:9,vignett:2,violat:2,vowel:101,vvv:23,vvvv:23,w3c:97,wai:[2,5,10,11,12,16,23,34,35,36,44,50,64,73,77,81,95,102,103],want:[2,6,42,43],warn:[2,4,9,12,18,24,27,32,39,40,42,44,53,63,64,65,66,84,94,99],warnfix:2,warsaw:[2,92],wcwidth:101,weakli:79,web:97,wed:23,week:[20,
23],weekdai:26,weekofmonth:22,weekofyear:22,weight:64,well:[2,9,13,36,45,49,64,87,101],were:[2,5,60,95],werner:10,western:5,wget:1,what:[0,4,5,8,9,11,17,39,43],whatev:12,when:[2,4,5,6,8,12,17,23,43,53,64,66,68,80,83,90,91,102],whenev:[4,5,65],where:[2,5,17,23,24,32,39,42,43,51,58,63,67,76,79,83,84,85,86,89,91,98,102],wherea:23,wherev:[77,87,88],whether:[2,6,17,23,27,29,31,34,35,36,38,44,46,49,50,58,64,66,81,83,84,87,88,89,90,97,100],which:[1,2,5,6,8,9,10,13,19,29,30,40,44,51,62,64,67,68,73,79,80,81,82,91,97,102],white:[2,9,12,13,18,46,58,66,76,85,86,98,102],white_spac:[9,18,76,81,85],whitespace_onli:[2,102],who:6,whole:[8,60,65],wickham:0,wide:[0,5,26,97],width:[0,2,3,9,13,23,26,53,68,102],wieczori:95,wiki:97,wikipedia:97,win:2,winbuild:2,window:[2,5,30,33,36,62,90,99,103],windtfmt:2,winnmfmt:2,wise:[2,7,13],wish:[1,12,48,76,81,84],within:[1,2,4,6,8,12,18,23,27,30,46,58,60,66,87,88,102],without:[0,3,6,23,66],word:[0,2,3,8,9,12,19,47,59,63,66,69,76,82,86,89,93],word_boundari:66,work:[1,2,5,30,31,41,65,87,97,99],world:[5,97],worst:11,worth:93,would:[8,62,66,98],wparenthes:2,wraca:95,wrap:[0,2,3,8,13,68,88],wrapper:[60,98],write:[0,3,8,13],writelin:103,written:[5,30,66],wspace:[84,98],www:[5,6,9,12,83,97,101],x1a:40,xaaaax:[46,58],xhh:12,xml:30,xnox:2,xtfrm:72,xxx:[23,48,99],xxxx:23,xxxxx:23,xyx:60,xyz:51,year:[5,20,21,22,23,90,91],yet:[2,13,97,98],yield:[2,23,46,67],you:[0,1,2,4,5,6,9,10,11,12,17,30,31,38,39,42,43,48,51,52,55,57,58,59,62,66,70,76,81,84,85,97,98,102],your:[1,4,5,6,9,38,39,62,84,98],yutannihil:2,yyyi:23,yyyyi:23,zc1:27,zero:[0,2,3,5,9,12,23,58,81,101,102],zip:[1,2],zipf:69,zone:[0,2,3,13,20,21,22,23],zwnbsp:9,zwsp:9,zxy:78,zzz:23,zzzz:23,zzzzz:23},titles:["stringi: THE String Processing Package for R","Installing stringi","What Is New in stringi","R Package stringi Reference","about_arguments: Passing Arguments to Functions in stringi","about_encoding: Character Encodings and stringi","about_locale: Locales and stringi","about_search: String 
Searching","about_search_boundaries: Text Boundary Analysis in stringi","about_search_charclass: Character Classes in stringi","about_search_coll: Locale-Sensitive Text Searching in stringi","about_search_fixed: Locale-Insensitive Fixed Pattern Matching in stringi","about_search_regex: Regular Expressions in stringi","about_stringi: THE String Processing Package","operator_add: Concatenate Two Character Vectors","operator_compare: Compare Strings with or without Collation","operator_dollar: C-Style Formatting with sprintf as a Binary Operator","stri_compare: Compare Strings with or without Collation","stri_count: Count the Number of Pattern Matches","stri_count_boundaries: Count the Number of Text Boundaries","stri_datetime_add: Date and Time Arithmetic","stri_datetime_create: Create a Date-Time Object","stri_datetime_fields: Get Values for Date and Time Fields","stri_datetime_format: Date and Time Formatting and Parsing","stri_datetime_fstr: Convert strptime-Style Format Strings","stri_datetime_now: Get Current Date and Time","stri_datetime_symbols: List Localizable Date-Time Formatting Data","stri_detect: Detect a Pattern Match","stri_dup: Duplicate Strings","stri_duplicated: Determine Duplicated Elements","stri_enc_detect: Detect Character Set and Language","stri_enc_detect2: [DEPRECATED] Detect Locale-Sensitive Character Encoding","stri_enc_fromutf32: Convert From UTF-32","stri_enc_info: Query a Character Encoding","stri_enc_isascii: Check If a Data Stream Is Possibly in ASCII","stri_enc_isutf16: Check If a Data Stream Is Possibly in UTF-16 or UTF-32","stri_enc_isutf8: Check If a Data Stream Is Possibly in UTF-8","stri_enc_list: List Known Character Encodings","stri_enc_mark: Get Declared Encodings of Each String","stri_enc_set: Set or Get Default Character Encoding in stringi","stri_enc_toascii: Convert To ASCII","stri_enc_tonative: Convert Strings To Native Encoding","stri_enc_toutf32: Convert Strings To UTF-32","stri_enc_toutf8: Convert Strings To 
UTF-8","stri_encode: Convert Strings Between Given Encodings","stri_escape_unicode: Escape Unicode Code Points","stri_extract: Extract Occurrences of a Pattern","stri_extract_boundaries: Extract Data Between Text Boundaries","stri_flatten: Flatten a String","stri_info: Query Default Settings for stringi","stri_isempty: Determine if a String is of Length Zero","stri_join: Concatenate Character Vectors","stri_join_list: Concatenate Strings in a List","stri_length: Count the Number of Code Points","stri_list2matrix: Convert a List to a Character Matrix","stri_locale_info: Query Given Locale","stri_locale_list: List Available Locales","stri_locale_set: Set or Get Default Locale in stringi","stri_locate: Locate Occurrences of a Pattern","stri_locate_boundaries: Locate Text Boundaries","stri_match: Extract Regex Pattern Matches, Together with Capture Groups","stri_na2empty: Replace NAs with Empty Strings","stri_numbytes: Count the Number of Bytes","stri_opts_brkiter: Generate a List with BreakIterator Settings","stri_opts_collator: Generate a List with Collator Settings","stri_opts_fixed: Generate a List with Fixed Pattern Search Engine\u2019s Settings","stri_opts_regex: Generate a List with Regex Matcher Settings","stri_order: Ordering Permutation","stri_pad: Pad (Center/Left/Right Align) a String","stri_rand_lipsum: A Lorem Ipsum Generator","stri_rand_shuffle: Randomly Shuffle Code Points in Each String","stri_rand_strings: Generate Random Strings","stri_rank: Ranking","stri_read_lines: Read Text Lines from a Text File","stri_read_raw: Read Text File as Raw","stri_remove_empty: Remove All Empty Strings from a Character Vector","stri_replace: Replace Occurrences of a Pattern","stri_replace_na: Replace Missing Values in a Character Vector","stri_reverse: Reverse Each String","stri_sort: Sorting","stri_sort_key: Sort Keys","stri_split: Split a String By Pattern Matches","stri_split_boundaries: Split a String at Text Boundaries","stri_split_lines: Split a String Into Text 
Lines","stri_startsendswith: Determine if the Start or End of a String Matches a Pattern","stri_stats_general: General Statistics for a Character Vector","stri_stats_latex: Statistics for a Character Vector Containing LaTeX Commands","stri_sub: Extract a Substring From or Replace a Substring In a Character Vector","stri_sub_all: Extract or Replace Multiple Substrings","stri_subset: Select Elements that Match a Given Pattern","stri_timezone_info: Query a Given Time Zone","stri_timezone_list: List Available Time Zone Identifiers","stri_timezone_set: Set or Get Default Time Zone in stringi","stri_trans_casemap: Transform Strings with Case Mapping","stri_trans_char: Translate Characters","stri_trans_general: General Text Transforms, Including Transliteration","stri_trans_list: List Available Text Transforms and Transliterators","stri_trans_nf: Perform or Check For Unicode Normalization","stri_trim: Trim Characters from the Left and/or Right Side of a String","stri_unescape_unicode: Un-escape All Escape Sequences","stri_unique: Extract Unique Elements","stri_width: Determine the Width of Code Points","stri_wrap: Word Wrap Text to Format Paragraphs","stri_write_lines: Write Text Lines to a Text 
File"],titleterms:{"2013":2,"2014":2,"2015":2,"2016":2,"2017":2,"2018":2,"2019":2,"2020":2,"2021":2,"byte":[11,62],"case":93,"class":9,"default":[6,39,49,57,92],"function":[4,6,12],"new":2,For:97,Into:83,NAs:[4,61],THE:[0,13],about_argu:4,about_encod:5,about_local:6,about_search:7,about_search_boundari:8,about_search_charclass:9,about_search_col:10,about_search_fix:11,about_search_regex:12,about_stringi:13,align:68,all:[75,99],also:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],analysi:8,argument:[4,14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102,103],arithmet:20,ascii:[34,40],attribut:4,author:13,avail:[13,56,91,96],awar:10,between:[44,47],binari:[9,16],boundari:[8,19,47,59,82],breakiter:63,build:1,captur:60,categori:9,center:68,charact:[5,9,12,14,30,31,33,37,39,51,54,75,77,85,86,87,94,98],check:[34,35,36,97],code:[45,53,70,101],coercion:4,collat:[15,17,64],command:86,compar:[11,15,17],concaten:[14,51,52],conclus:1,contain:86,convers:5,convert:[24,32,40,41,42,43,44,54],count:[18,19,53,62],cran:2,creat:21,current:25,customis:1,data:[26,34,35,36,47],date:[20,21,22,23,25,26],declar:38,deprec:31,descript:[4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],detail:[5,6,7,8,9,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,4
8,50,51,52,53,54,55,56,57,58,59,60,62,63,64,65,66,67,68,69,70,71,72,73,74,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102,103],detect:[5,27,30,31],determin:[29,50,84,101],devel:2,duplic:[28,29],each:[38,70,78],element:[29,89,100],empti:[61,75],encod:[5,31,33,37,38,39,41,44],end:84,engin:[10,65],escap:[45,99],exampl:[14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,34,36,45,46,47,48,50,51,52,53,54,55,57,58,59,60,61,62,64,65,66,67,68,69,70,71,72,75,76,77,78,79,80,81,82,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102],express:12,extract:[46,47,60,87,88,100],facil:13,field:22,file:[73,74,103],fix:[11,65],flatten:48,format:[16,23,24,26,102],from:[32,73,75,87,98],gener:[9,63,64,65,66,69,71,85,95],get:[22,25,38,39,57,92],given:[44,55,89,90],glanc:12,group:60,handl:4,icu4c:1,icu:12,identifi:[6,91],includ:95,input:4,insensit:11,instal:1,introduct:1,ipsum:69,kei:80,known:37,languag:30,latex:86,left:[68,98],length:50,line:[73,83,103],list:[26,37,52,54,56,63,64,65,66,91,96],local:[6,10,11,31,55,56,57],localiz:26,locat:[58,59],lorem:69,map:93,match:[11,18,27,60,81,84,89],matcher:66,matrix:54,meta:12,miss:[4,77],multipl:88,nativ:41,normal:97,note:6,number:[18,19,53,62],object:[4,21],occurr:[46,58,76],oper:[12,16],operator_add:14,operator_compar:15,operator_dollar:16,order:67,packag:[0,3,13],pad:68,paragraph:102,pars:23,pass:4,pattern:[9,11,18,27,46,58,60,65,76,81,84,89],perform:97,permut:67,point:[45,53,70,101],posix:9,possibl:[34,35,36],preserv:4,process:[0,1,13],properti:9,queri:[33,49,55,90],random:71,randomli:70,rank:72,raw:74,read:[73,74],refer:[3,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,91,92,93,95,96,97,100,101,102],regex:[12,60,66],regular:12,remov:75,replac:[61,76,77,87,88],revers:78,right:[68,98],search:[7,10,65],see:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72
,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],select:89,sensit:[6,10,31],sequenc:99,set:[30,39,49,57,63,64,65,66,92],shuffl:70,side:98,sort:[79,80],split:[81,82,83],sprintf:16,start:84,statist:[85,86],stream:[34,35,36],stri_compar:17,stri_count:18,stri_count_boundari:19,stri_datetime_add:20,stri_datetime_cr:21,stri_datetime_field:22,stri_datetime_format:23,stri_datetime_fstr:24,stri_datetime_now:25,stri_datetime_symbol:26,stri_detect:27,stri_dup:28,stri_dupl:29,stri_enc_detect2:31,stri_enc_detect:30,stri_enc_fromutf32:32,stri_enc_info:33,stri_enc_isascii:34,stri_enc_isutf16:35,stri_enc_isutf8:36,stri_enc_list:37,stri_enc_mark:38,stri_enc_set:39,stri_enc_toascii:40,stri_enc_ton:41,stri_enc_toutf32:42,stri_enc_toutf8:43,stri_encod:44,stri_escape_unicod:45,stri_extract:46,stri_extract_boundari:47,stri_flatten:48,stri_info:49,stri_isempti:50,stri_join:51,stri_join_list:52,stri_length:53,stri_list2matrix:54,stri_loc:58,stri_locale_info:55,stri_locale_list:56,stri_locale_set:57,stri_locate_boundari:59,stri_match:60,stri_na2empti:61,stri_numbyt:62,stri_opts_brkit:63,stri_opts_col:64,stri_opts_fix:65,stri_opts_regex:66,stri_ord:67,stri_pad:68,stri_rand_lipsum:69,stri_rand_shuffl:70,stri_rand_str:71,stri_rank:72,stri_read_lin:73,stri_read_raw:74,stri_remove_empti:75,stri_replac:76,stri_replace_na:77,stri_revers:78,stri_sort:79,stri_sort_kei:80,stri_split:81,stri_split_boundari:82,stri_split_lin:83,stri_startsendswith:84,stri_stats_gener:85,stri_stats_latex:86,stri_sub:87,stri_sub_al:88,stri_subset:89,stri_timezone_info:90,stri_timezone_list:91,stri_timezone_set:92,stri_trans_casemap:93,stri_trans_char:94,stri_trans_gener:95,stri_trans_list:96,stri_trans_nf:97,stri_trim:98,stri_unescape_unicod:99,stri_uniqu:100,stri_width:101,stri_wrap:102,stri_write_lin:103,string:[0,7,10,13,15,17,24,28,38,41,42,43,44,48,50,52,61,68,70,71,75,78,81,82,83,84,93,98],stringi:[0,1,2,3,4,5,6,8,9,10,11,12,39,49,57,92],strptime:24,style:[16,24],subst
r:[87,88],support:1,text:[8,10,19,47,59,73,74,82,83,95,96,102,103],time:[20,21,22,23,25,26,90,91,92],togeth:60,transform:[93,95,96],translat:94,transliter:[95,96],trim:98,two:14,unicod:[9,45,97],unicodeset:9,uniqu:100,usag:[14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],utf:[5,32,35,36,42,43],valu:[4,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],vector:[4,14,51,75,77,85,86,87],what:2,width:101,without:[15,17],word:102,wrap:102,write:103,zero:50,zone:[90,91,92]}}) \ No newline at end of file diff --git a/devel/sphinx/news.rst b/devel/sphinx/news.rst index 1d1564f71..e89e51b5f 100644 --- a/devel/sphinx/news.rst +++ b/devel/sphinx/news.rst @@ -15,14 +15,20 @@ What Is New in *stringi* - …todo… #401 (update ICU4C to 69.1), The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39. -- …todo… #408 (stri_trans_casefold), +- [NEW FEATURE] #408: …todo… ``stri_trans_casefold()``, -- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing - ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). +- [NEW FEATURE] #421: ``stri_rank()`` ranks strings in a character + vector (e.g., for ordering data frames with regards to multiple + criteria, the ranks can be passed to ``order()``, see #219). + +- [BUGFIX] ``stri_sort_key()`` now outputs ``bytes``-encoded strings. - [BUGFIX] #415: ``locale=''`` was not equivalent to ``locale=NULL`` in ``stri_opts_collator()``. +- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing + ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). 
+ 1.5.3 (2020-09-04) **CRAN** --------------------------- diff --git a/devel/sphinx/rapi.rst b/devel/sphinx/rapi.rst index 216e166d7..687690722 100644 --- a/devel/sphinx/rapi.rst +++ b/devel/sphinx/rapi.rst @@ -72,6 +72,7 @@ R Package *stringi* Reference rapi/stri_rand_lipsum rapi/stri_rand_shuffle rapi/stri_rand_strings + rapi/stri_rank rapi/stri_read_lines rapi/stri_read_raw rapi/stri_remove_empty diff --git a/devel/sphinx/rapi/about_encoding.rst b/devel/sphinx/rapi/about_encoding.rst index ee364b6a0..0a43a6b40 100644 --- a/devel/sphinx/rapi/about_encoding.rst +++ b/devel/sphinx/rapi/about_encoding.rst @@ -43,7 +43,7 @@ Character Encodings in R Data in memory are just bytes (small integer values) – an en\ *coding* is a way to represent characters with such numbers, it is a semantic 'key' to understand a given byte sequence. For example, in ISO-8859-2 (Central European), the value 177 represents Polish “a with ogonek”, and in ISO-8859-1 (Western European), the same value denotes the “plus-minus” sign. Thus, a character encoding is a translation scheme: we need to communicate with R somehow, relying on how it represents strings. -Basically, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. +Overall, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. 
Character strings in R (internally) can be declared to be in: diff --git a/devel/sphinx/rapi/about_locale.rst b/devel/sphinx/rapi/about_locale.rst index 9257e65d1..014a69a9a 100644 --- a/devel/sphinx/rapi/about_locale.rst +++ b/devel/sphinx/rapi/about_locale.rst @@ -54,6 +54,6 @@ See Also Other locale_management: `stri_locale_info() `__, `stri_locale_list() `__, `stri_locale_set() `__ -Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_coll `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/devel/sphinx/rapi/about_search_boundaries.rst b/devel/sphinx/rapi/about_search_boundaries.rst index 8e404b39f..831b2ee74 100644 --- a/devel/sphinx/rapi/about_search_boundaries.rst +++ b/devel/sphinx/rapi/about_search_boundaries.rst @@ -43,7 +43,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, 
`stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/rapi/about_search_coll.rst b/devel/sphinx/rapi/about_search_coll.rst index 5514cf651..13ce9358d 100644 --- a/devel/sphinx/rapi/about_search_coll.rst +++ b/devel/sphinx/rapi/about_search_coll.rst @@ -29,6 +29,6 @@ See Also Other search_coll: `about_search `__, `stri_opts_collator() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() 
`__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_locale `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/devel/sphinx/rapi/about_stringi.rst b/devel/sphinx/rapi/about_stringi.rst index 4f891e487..a82d1573a 100644 --- a/devel/sphinx/rapi/about_stringi.rst +++ b/devel/sphinx/rapi/about_stringi.rst @@ -4,7 +4,7 @@ about_stringi: THE String Processing Package Description ~~~~~~~~~~~ -stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any “native” character encoding. +stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any native character encoding. **Keywords**: R, text processing, character strings, internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode. @@ -19,7 +19,7 @@ Manual pages on general topics: - `about_encoding `__ – character encoding issues, including information on encoding management in stringi, as well as on encoding detection and conversion. -- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, sorting, case-folding, and searching. +- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. 
In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, ranking, sorting, case-folding, and searching. - `about_arguments `__ – information on how stringi treats its functions' arguments. @@ -54,7 +54,7 @@ Refer to the following: - `stri_trans_tolower `__ (among others) for case mapping, i.e., conversion to lower, UPPER, or Title Case, `stri_trans_nfc `__ (among others) for Unicode normalization, `stri_trans_char `__ for translating individual code points, and `stri_trans_general `__ for other universal yet powerful text transforms, including transliteration. -- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. +- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_rank `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. - `stri_split_lines `__ (among others) to split a string into text lines. @@ -69,7 +69,7 @@ Note that each man page provides many further links to other interesting facilit Author(s) ~~~~~~~~~ -Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM and others. The Unicode Character Database is due to Unicode, Inc.; see the COPYRIGHTS file for more details. +Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM, Unicode, Inc., and others. 
References ~~~~~~~~~~ diff --git a/devel/sphinx/rapi/operator_compare.rst b/devel/sphinx/rapi/operator_compare.rst index 5aebca12e..ebcfa325c 100644 --- a/devel/sphinx/rapi/operator_compare.rst +++ b/devel/sphinx/rapi/operator_compare.rst @@ -67,7 +67,7 @@ All the functions return a logical vector indicating the result of a pairwise co See Also ~~~~~~~~ -Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_compare.rst b/devel/sphinx/rapi/stri_compare.rst index ec92c611c..2da14bd78 100644 --- a/devel/sphinx/rapi/stri_compare.rst +++ b/devel/sphinx/rapi/stri_compare.rst @@ -72,7 +72,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other 
locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_count_boundaries.rst b/devel/sphinx/rapi/stri_count_boundaries.rst index cadcde0bd..308bbb4be 100644 --- a/devel/sphinx/rapi/stri_count_boundaries.rst +++ b/devel/sphinx/rapi/stri_count_boundaries.rst @@ -51,7 +51,7 @@ See Also Other search_count: `about_search `__, `stri_count() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/rapi/stri_duplicated.rst 
b/devel/sphinx/rapi/stri_duplicated.rst index de02931dd..21173f55c 100644 --- a/devel/sphinx/rapi/stri_duplicated.rst +++ b/devel/sphinx/rapi/stri_duplicated.rst @@ -68,7 +68,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_enc_detect2.rst b/devel/sphinx/rapi/stri_enc_detect2.rst index bf07d139d..533a7b2bc 100644 --- a/devel/sphinx/rapi/stri_enc_detect2.rst +++ b/devel/sphinx/rapi/stri_enc_detect2.rst @@ -51,6 +51,6 @@ The guesses are ordered by decreasing confidence. 
See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other encoding_detection: `about_encoding `__, `stri_enc_detect() `__, `stri_enc_isascii() `__, `stri_enc_isutf16be() `__, `stri_enc_isutf8() `__ diff --git a/devel/sphinx/rapi/stri_extract_boundaries.rst b/devel/sphinx/rapi/stri_extract_boundaries.rst index aecf953a6..4eb9875e0 100644 --- a/devel/sphinx/rapi/stri_extract_boundaries.rst +++ b/devel/sphinx/rapi/stri_extract_boundaries.rst @@ -74,7 +74,7 @@ See Also Other search_extract: `about_search `__, `stri_extract_all() `__, `stri_match_all() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() 
`__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/rapi/stri_locate_boundaries.rst b/devel/sphinx/rapi/stri_locate_boundaries.rst index 3bdc3714e..96b5e6e31 100644 --- a/devel/sphinx/rapi/stri_locate_boundaries.rst +++ b/devel/sphinx/rapi/stri_locate_boundaries.rst @@ -66,7 +66,7 @@ Other search_locate: `about_search `__, `stri_locate_all() `__, `stri_sub_all() `__, `stri_sub() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, 
`stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/rapi/stri_opts_collator.rst b/devel/sphinx/rapi/stri_opts_collator.rst index 85989bb7e..db1c9d606 100644 --- a/devel/sphinx/rapi/stri_opts_collator.rst +++ b/devel/sphinx/rapi/stri_opts_collator.rst @@ -84,7 +84,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other search_coll: `about_search_coll `__, `about_search `__ diff --git a/devel/sphinx/rapi/stri_order.rst b/devel/sphinx/rapi/stri_order.rst index 81334a958..f7e49d7c8 100644 --- a/devel/sphinx/rapi/stri_order.rst +++ b/devel/sphinx/rapi/stri_order.rst @@ -33,10 +33,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intuitive behavior of lexicographic sorting on numeric inputs. +As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. 
This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. +For ordering with regards to multiple criteria (such as sorting data frames by more than 1 column), see `stri_rank `__. + Value ~~~~~ @@ -50,7 +52,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_rank.rst b/devel/sphinx/rapi/stri_rank.rst new file mode 100644 index 000000000..1f13d4df6 --- /dev/null +++ b/devel/sphinx/rapi/stri_rank.rst @@ -0,0 +1,62 @@ +stri_rank: Ranking +================== + +Description +~~~~~~~~~~~ + +This function ranks each string in a character vector according to a locale-dependent lexicographic order. It is a portable replacement for the base ``xtfrm`` function. + +Usage +~~~~~ + +.. 
code-block:: r + + stri_rank(str, ..., opts_collator = NULL) + +Arguments +~~~~~~~~~ + ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``str`` | a character vector | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``...`` | additional settings for ``opts_collator`` | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``opts_collator`` | a named list with ICU Collator's options, see `stri_opts_collator `__, ``NULL`` for default collation options | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ + +Details +~~~~~~~ + +Missing values result in missing ranks and tied observations receive the same ranks (based on min). + +For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. + +Value +~~~~~ + +The result is a vector of ranks corresponding to each string in ``str``. + +References +~~~~~~~~~~ + +*Collation* - ICU User Guide, http://userguide.icu-project.org/collation + +See Also +~~~~~~~~ + +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ + +Examples +~~~~~~~~ + +.. 
code-block:: r + + stri_rank(c('hladny', 'chladny'), locale='pl_PL') + stri_rank(c('hladny', 'chladny'), locale='sk_SK') + + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10)) # lexicographic order + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE) + + # Ordering a data frame with respect to two criteria: + X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8)) + X[order(stri_rank(X$a), X$b), ] diff --git a/devel/sphinx/rapi/stri_sort.rst b/devel/sphinx/rapi/stri_sort.rst index 64c922946..bff8c070d 100644 --- a/devel/sphinx/rapi/stri_sort.rst +++ b/devel/sphinx/rapi/stri_sort.rst @@ -4,7 +4,7 @@ stri_sort: Sorting Description ~~~~~~~~~~~ -This function sorts a character vector according to the locale-dependent lexicographic order. +This function sorts a character vector according to a locale-dependent lexicographic order. Usage ~~~~~ @@ -33,7 +33,7 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intitive behavior of lexicographic sorting on numeric inputs. +As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. 
@@ -50,7 +50,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_sort_key.rst b/devel/sphinx/rapi/stri_sort_key.rst index fb1f33588..1fa67a493 100644 --- a/devel/sphinx/rapi/stri_sort_key.rst +++ b/devel/sphinx/rapi/stri_sort_key.rst @@ -4,7 +4,7 @@ stri_sort_key: Sort Keys Description ~~~~~~~~~~~ -This function computes a locale-dependent 'sort key', which is an alternative character representation of the string that, when ordered in the C locale (which orders using bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale with the ability to be locale-aware. +This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale (which orders using the underlying bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale (e.g., the ``strcmp`` function in libc) with the ability to be locale-aware. 
Usage ~~~~~ @@ -29,10 +29,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. +See also `stri_rank `__ for ranking strings within a single character vector, i.e., generating relative sort keys. + Value ~~~~~ -The result is a character vector with the same length as ``str`` that contains the sort keys. +The result is a character vector with the same length as ``str`` that contains the sort keys. The output is marked as ``bytes``-encoded. References ~~~~~~~~~~ @@ -42,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_split_boundaries.rst b/devel/sphinx/rapi/stri_split_boundaries.rst index 4cf25d35e..fc2367aa6 100644 --- a/devel/sphinx/rapi/stri_split_boundaries.rst +++ b/devel/sphinx/rapi/stri_split_boundaries.rst @@ -60,7 +60,7 @@ See Also Other search_split: `about_search `__, `stri_split_lines() `__, `stri_split() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() 
`__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/devel/sphinx/rapi/stri_trans_casemap.rst b/devel/sphinx/rapi/stri_trans_casemap.rst index 0171d7399..54b76c9f1 100644 --- a/devel/sphinx/rapi/stri_trans_casemap.rst +++ b/devel/sphinx/rapi/stri_trans_casemap.rst @@ -60,7 +60,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, 
`stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ Other transform: `stri_trans_char() `__, `stri_trans_general() `__, `stri_trans_list() `__, `stri_trans_nfc() `__ diff --git a/devel/sphinx/rapi/stri_unique.rst b/devel/sphinx/rapi/stri_unique.rst index ea6906c9c..7feb971ae 100644 --- a/devel/sphinx/rapi/stri_unique.rst +++ b/devel/sphinx/rapi/stri_unique.rst @@ -44,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/devel/sphinx/rapi/stri_wrap.rst b/devel/sphinx/rapi/stri_wrap.rst index 1ffd8a838..25e4d7fea 100644 --- a/devel/sphinx/rapi/stri_wrap.rst +++ b/devel/sphinx/rapi/stri_wrap.rst @@ -84,7 +84,7 @@ D.E. Knuth, M.F. 
Plass, Breaking paragraphs into lines, *Software: Practice and See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__ diff --git a/devel/tinytest/test-sort.R b/devel/tinytest/test-sort.R index 776b7e1eb..d404ce170 100644 --- a/devel/tinytest/test-sort.R +++ b/devel/tinytest/test-sort.R @@ -171,3 +171,38 @@ if (getRversion() > "3.3.0") { expect_equivalent(radix_order(stri_sort_key(x, numeric = TRUE)), stri_order(x, numeric = TRUE)) } + + +x <- LETTERS +expect_equivalent(stri_rank(x), rank(x, ties.method="min")) + +x <- rev(LETTERS) +expect_equivalent(stri_rank(x), rank(x, ties.method="min")) + +x <- c("b", "a", "a", "b", "a", "b", "a", "b", "a") +expect_equivalent(stri_rank(x), rank(x, ties.method="min")) + +x <- c("a", "a", "b", NA, "a", "b", "a", "b", "a", NA) +r <- rank(x, ties.method="min") +r[is.na(x)] <- NA 
+expect_equivalent(stri_rank(x), r) + +expect_equivalent(stri_rank(character(0)), integer(0)) + +expect_equivalent(stri_rank(NA), NA_integer_) + + +expect_equivalent(stri_rank(c(NA, 1, 2)), c(NA, 1, 2)) +expect_equivalent(stri_rank(c(2, NA, 1)), c(2, NA, 1)) +expect_equivalent(stri_rank(c(NA, 1)), c(NA, 1)) +expect_equivalent(stri_rank(c(1, NA)), c(1, NA)) + +expect_equivalent(stri_rank(c(rep(NA, 100), 1)), c(rep(NA, 100), 1)) + +expect_equivalent(stri_rank(c(rep(NA, 100))), c(rep(NA_integer_, 100))) + +expect_equivalent(stri_rank(c('hladny', 'chladny'), locale='pl_PL'), c(2, 1)) + +expect_equivalent(stri_rank(c('hladny', 'chladny'), locale='sk_SK'), c(1, 2)) + + diff --git a/docs/_sources/news.rst.txt b/docs/_sources/news.rst.txt index 1d1564f71..e89e51b5f 100644 --- a/docs/_sources/news.rst.txt +++ b/docs/_sources/news.rst.txt @@ -15,14 +15,20 @@ What Is New in *stringi* - …todo… #401 (update ICU4C to 69.1), The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39. -- …todo… #408 (stri_trans_casefold), +- [NEW FEATURE] #408: …todo… ``stri_trans_casefold()``, -- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing - ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). +- [NEW FEATURE] #421: ``stri_rank()`` ranks strings in a character + vector (e.g., for ordering data frames with regard to multiple + criteria, the ranks can be passed to ``order()``, see #219). + +- [BUGFIX] ``stri_sort_key()`` now outputs ``bytes``-encoded strings. - [BUGFIX] #415: ``locale=''`` was not equivalent to ``locale=NULL`` in ``stri_opts_collator()``. +- [INTERNAL] #414: Use ``LEVELS(x)`` macro instead of accessing + ``(x)->sxpinfo.gp`` directly (@lukaszdaniel). 
+ 1.5.3 (2020-09-04) **CRAN** --------------------------- diff --git a/docs/_sources/rapi.rst.txt b/docs/_sources/rapi.rst.txt index 216e166d7..687690722 100644 --- a/docs/_sources/rapi.rst.txt +++ b/docs/_sources/rapi.rst.txt @@ -72,6 +72,7 @@ R Package *stringi* Reference rapi/stri_rand_lipsum rapi/stri_rand_shuffle rapi/stri_rand_strings + rapi/stri_rank rapi/stri_read_lines rapi/stri_read_raw rapi/stri_remove_empty diff --git a/docs/_sources/rapi/about_encoding.rst.txt b/docs/_sources/rapi/about_encoding.rst.txt index ee364b6a0..0a43a6b40 100644 --- a/docs/_sources/rapi/about_encoding.rst.txt +++ b/docs/_sources/rapi/about_encoding.rst.txt @@ -43,7 +43,7 @@ Character Encodings in R Data in memory are just bytes (small integer values) – an en\ *coding* is a way to represent characters with such numbers, it is a semantic 'key' to understand a given byte sequence. For example, in ISO-8859-2 (Central European), the value 177 represents Polish “a with ogonek”, and in ISO-8859-1 (Western European), the same value denotes the “plus-minus” sign. Thus, a character encoding is a translation scheme: we need to communicate with R somehow, relying on how it represents strings. -Basically, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. +Overall, R has a very simple encoding marking mechanism, see `stri_enc_mark `__. There is an implicit assumption that your platform's default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU's initialization and each time when you change it manually by calling `stri_enc_set `__. 
Character strings in R (internally) can be declared to be in: diff --git a/docs/_sources/rapi/about_locale.rst.txt b/docs/_sources/rapi/about_locale.rst.txt index 9257e65d1..014a69a9a 100644 --- a/docs/_sources/rapi/about_locale.rst.txt +++ b/docs/_sources/rapi/about_locale.rst.txt @@ -54,6 +54,6 @@ See Also Other locale_management: `stri_locale_info() `__, `stri_locale_list() `__, `stri_locale_set() `__ -Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_coll `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/docs/_sources/rapi/about_search_boundaries.rst.txt b/docs/_sources/rapi/about_search_boundaries.rst.txt index 8e404b39f..831b2ee74 100644 --- a/docs/_sources/rapi/about_search_boundaries.rst.txt +++ b/docs/_sources/rapi/about_search_boundaries.rst.txt @@ -43,7 +43,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, 
`stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/docs/_sources/rapi/about_search_coll.rst.txt b/docs/_sources/rapi/about_search_coll.rst.txt index 5514cf651..13ce9358d 100644 --- a/docs/_sources/rapi/about_search_coll.rst.txt +++ b/docs/_sources/rapi/about_search_coll.rst.txt @@ -29,6 +29,6 @@ See Also Other search_coll: `about_search `__, `stri_opts_collator() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, 
`stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other stringi_general_topics: `about_arguments `__, `about_encoding `__, `about_locale `__, `about_search_boundaries `__, `about_search_charclass `__, `about_search_fixed `__, `about_search_regex `__, `about_search `__, `about_stringi `__ diff --git a/docs/_sources/rapi/about_stringi.rst.txt b/docs/_sources/rapi/about_stringi.rst.txt index 4f891e487..a82d1573a 100644 --- a/docs/_sources/rapi/about_stringi.rst.txt +++ b/docs/_sources/rapi/about_stringi.rst.txt @@ -4,7 +4,7 @@ about_stringi: THE String Processing Package Description ~~~~~~~~~~~ -stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any “native” character encoding. +stringi is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, and under any native character encoding. **Keywords**: R, text processing, character strings, internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode. @@ -19,7 +19,7 @@ Manual pages on general topics: - `about_encoding `__ – character encoding issues, including information on encoding management in stringi, as well as on encoding detection and conversion. -- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, sorting, case-folding, and searching. 
+- `about_locale `__ – locale issues, including locale management and specification in stringi, and the list of locale-sensitive operations. In particular, see `stri_opts_collator `__ for a description of the string collation algorithm, which is used for string comparing, ordering, ranking, sorting, case-folding, and searching. - `about_arguments `__ – information on how stringi treats its functions' arguments. @@ -54,7 +54,7 @@ Refer to the following: - `stri_trans_tolower `__ (among others) for case mapping, i.e., conversion to lower, UPPER, or Title Case, `stri_trans_nfc `__ (among others) for Unicode normalization, `stri_trans_char `__ for translating individual code points, and `stri_trans_general `__ for other universal yet powerful text transforms, including transliteration. -- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. +- `stri_cmp `__, `%s<% `__, `stri_order `__, `stri_sort `__, `stri_rank `__, `stri_unique `__, and `stri_duplicated `__ for collation-based, locale-aware operations, see also `about_locale `__. - `stri_split_lines `__ (among others) to split a string into text lines. @@ -69,7 +69,7 @@ Note that each man page provides many further links to other interesting facilit Author(s) ~~~~~~~~~ -Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM and others. The Unicode Character Database is due to Unicode, Inc.; see the COPYRIGHTS file for more details. +Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM, Unicode, Inc., and others. 
References ~~~~~~~~~~ diff --git a/docs/_sources/rapi/operator_compare.rst.txt b/docs/_sources/rapi/operator_compare.rst.txt index 5aebca12e..ebcfa325c 100644 --- a/docs/_sources/rapi/operator_compare.rst.txt +++ b/docs/_sources/rapi/operator_compare.rst.txt @@ -67,7 +67,7 @@ All the functions return a logical vector indicating the result of a pairwise co See Also ~~~~~~~~ -Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_compare.rst.txt b/docs/_sources/rapi/stri_compare.rst.txt index ec92c611c..2da14bd78 100644 --- a/docs/_sources/rapi/stri_compare.rst.txt +++ b/docs/_sources/rapi/stri_compare.rst.txt @@ -72,7 +72,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() 
`__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_count_boundaries.rst.txt b/docs/_sources/rapi/stri_count_boundaries.rst.txt index cadcde0bd..308bbb4be 100644 --- a/docs/_sources/rapi/stri_count_boundaries.rst.txt +++ b/docs/_sources/rapi/stri_count_boundaries.rst.txt @@ -51,7 +51,7 @@ See Also Other search_count: `about_search `__, `stri_count() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff 
--git a/docs/_sources/rapi/stri_duplicated.rst.txt b/docs/_sources/rapi/stri_duplicated.rst.txt index de02931dd..21173f55c 100644 --- a/docs/_sources/rapi/stri_duplicated.rst.txt +++ b/docs/_sources/rapi/stri_duplicated.rst.txt @@ -68,7 +68,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_enc_detect2.rst.txt b/docs/_sources/rapi/stri_enc_detect2.rst.txt index bf07d139d..533a7b2bc 100644 --- a/docs/_sources/rapi/stri_enc_detect2.rst.txt +++ b/docs/_sources/rapi/stri_enc_detect2.rst.txt @@ -51,6 +51,6 @@ The guesses are ordered by decreasing confidence. 
See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other encoding_detection: `about_encoding `__, `stri_enc_detect() `__, `stri_enc_isascii() `__, `stri_enc_isutf16be() `__, `stri_enc_isutf8() `__ diff --git a/docs/_sources/rapi/stri_extract_boundaries.rst.txt b/docs/_sources/rapi/stri_extract_boundaries.rst.txt index aecf953a6..4eb9875e0 100644 --- a/docs/_sources/rapi/stri_extract_boundaries.rst.txt +++ b/docs/_sources/rapi/stri_extract_boundaries.rst.txt @@ -74,7 +74,7 @@ See Also Other search_extract: `about_search `__, `stri_extract_all() `__, `stri_match_all() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, 
`stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/docs/_sources/rapi/stri_locate_boundaries.rst.txt b/docs/_sources/rapi/stri_locate_boundaries.rst.txt index 3bdc3714e..96b5e6e31 100644 --- a/docs/_sources/rapi/stri_locate_boundaries.rst.txt +++ b/docs/_sources/rapi/stri_locate_boundaries.rst.txt @@ -66,7 +66,7 @@ Other search_locate: `about_search `__, `stri_locate_all() `__, `stri_sub_all() `__, `stri_sub() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_opts_brkiter() `__, 
`stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/docs/_sources/rapi/stri_opts_collator.rst.txt b/docs/_sources/rapi/stri_opts_collator.rst.txt index 85989bb7e..db1c9d606 100644 --- a/docs/_sources/rapi/stri_opts_collator.rst.txt +++ b/docs/_sources/rapi/stri_opts_collator.rst.txt @@ -84,7 +84,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other search_coll: `about_search_coll `__, `about_search `__ diff --git a/docs/_sources/rapi/stri_order.rst.txt b/docs/_sources/rapi/stri_order.rst.txt index 81334a958..f7e49d7c8 100644 --- a/docs/_sources/rapi/stri_order.rst.txt +++ b/docs/_sources/rapi/stri_order.rst.txt @@ -33,10 +33,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intuitive behavior of lexicographic sorting on numeric inputs. 
+As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. +For ordering with regards to multiple criteria (such as sorting data frames by more than 1 column), see `stri_rank `__. + Value ~~~~~ @@ -50,7 +52,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_rank.rst.txt b/docs/_sources/rapi/stri_rank.rst.txt new file mode 100644 index 000000000..1f13d4df6 --- /dev/null +++ b/docs/_sources/rapi/stri_rank.rst.txt @@ -0,0 +1,62 @@ +stri_rank: Ranking +================== + +Description +~~~~~~~~~~~ + +This function ranks each string in a character vector according to a locale-dependent lexicographic order. It is a portable replacement for the base ``xtfrm`` function. + +Usage +~~~~~ + +.. 
code-block:: r + + stri_rank(str, ..., opts_collator = NULL) + +Arguments +~~~~~~~~~ + ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``str`` | a character vector | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``...`` | additional settings for ``opts_collator`` | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ +| ``opts_collator`` | a named list with ICU Collator's options, see `stri_opts_collator `__, ``NULL`` for default collation options | ++-------------------+----------------------------------------------------------------------------------------------------------------------------------------+ + +Details +~~~~~~~ + +Missing values result in missing ranks and tied observations receive the same ranks (based on min). + +For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. + +Value +~~~~~ + +The result is a vector of ranks corresponding to each string in ``str``. + +References +~~~~~~~~~~ + +*Collation* - ICU User Guide, http://userguide.icu-project.org/collation + +See Also +~~~~~~~~ + +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ + +Examples +~~~~~~~~ + +.. 
code-block:: r + + stri_rank(c('hladny', 'chladny'), locale='pl_PL') + stri_rank(c('hladny', 'chladny'), locale='sk_SK') + + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10)) # lexicographic order + stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE) + + # Ordering a data frame with respect to two criteria: + X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8)) + X[order(stri_rank(X$a), X$b), ] diff --git a/docs/_sources/rapi/stri_sort.rst.txt b/docs/_sources/rapi/stri_sort.rst.txt index 64c922946..bff8c070d 100644 --- a/docs/_sources/rapi/stri_sort.rst.txt +++ b/docs/_sources/rapi/stri_sort.rst.txt @@ -4,7 +4,7 @@ stri_sort: Sorting Description ~~~~~~~~~~~ -This function sorts a character vector according to the locale-dependent lexicographic order. +This function sorts a character vector according to a locale-dependent lexicographic order. Usage ~~~~~ @@ -33,7 +33,7 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. -As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intitive behavior of lexicographic sorting on numeric inputs. +As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (STL's ``stable_sort``), which performs up to *N*log^2(N)* element comparisons, where *N* is the length of ``str``. 
@@ -50,7 +50,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_sort_key.rst.txt b/docs/_sources/rapi/stri_sort_key.rst.txt index fb1f33588..1fa67a493 100644 --- a/docs/_sources/rapi/stri_sort_key.rst.txt +++ b/docs/_sources/rapi/stri_sort_key.rst.txt @@ -4,7 +4,7 @@ stri_sort_key: Sort Keys Description ~~~~~~~~~~~ -This function computes a locale-dependent 'sort key', which is an alternative character representation of the string that, when ordered in the C locale (which orders using bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale with the ability to be locale-aware. +This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale (which orders using the underlying bytes directly), will give an equivalent ordering to the original string. 
It is useful for enhancing algorithms that sort only in the C locale (e.g., the ``strcmp`` function in libc) with the ability to be locale-aware. Usage ~~~~~ @@ -29,10 +29,12 @@ Details For more information on ICU's Collator and how to tune it up in stringi, refer to `stri_opts_collator `__. +See also `stri_rank `__ for ranking strings with a single character vector, i.e., generating relative sort keys. + Value ~~~~~ -The result is a character vector with the same length as ``str`` that contains the sort keys. +The result is a character vector with the same length as ``str`` that contains the sort keys. The output is marked as ``bytes``-encoded. References ~~~~~~~~~~ @@ -42,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_split_boundaries.rst.txt b/docs/_sources/rapi/stri_split_boundaries.rst.txt index 4cf25d35e..fc2367aa6 100644 --- a/docs/_sources/rapi/stri_split_boundaries.rst.txt +++ b/docs/_sources/rapi/stri_split_boundaries.rst.txt @@ -60,7 +60,7 @@ See Also Other search_split: `about_search `__, `stri_split_lines() `__, 
`stri_split() `__ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_trans_tolower() `__, `stri_unique() `__, `stri_wrap() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_lines() `__, `stri_trans_tolower() `__, `stri_wrap() `__ diff --git a/docs/_sources/rapi/stri_trans_casemap.rst.txt b/docs/_sources/rapi/stri_trans_casemap.rst.txt index 0171d7399..54b76c9f1 100644 --- a/docs/_sources/rapi/stri_trans_casemap.rst.txt +++ b/docs/_sources/rapi/stri_trans_casemap.rst.txt @@ -60,7 +60,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, 
`about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_unique() `__, `stri_wrap() `__ Other transform: `stri_trans_char() `__, `stri_trans_general() `__, `stri_trans_list() `__, `stri_trans_nfc() `__ diff --git a/docs/_sources/rapi/stri_unique.rst.txt b/docs/_sources/rapi/stri_unique.rst.txt index ea6906c9c..7feb971ae 100644 --- a/docs/_sources/rapi/stri_unique.rst.txt +++ b/docs/_sources/rapi/stri_unique.rst.txt @@ -44,7 +44,7 @@ References See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_wrap() `__ Examples ~~~~~~~~ diff --git a/docs/_sources/rapi/stri_wrap.rst.txt b/docs/_sources/rapi/stri_wrap.rst.txt index 1ffd8a838..25e4d7fea 100644 --- a/docs/_sources/rapi/stri_wrap.rst.txt +++ b/docs/_sources/rapi/stri_wrap.rst.txt @@ -84,7 +84,7 @@ D.E. Knuth, M.F. 
Plass, Breaking paragraphs into lines, *Software: Practice and See Also ~~~~~~~~ -Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ +Other locale_sensitive: `%s<%() `__, `about_locale `__, `about_search_boundaries `__, `about_search_coll `__, `stri_compare() `__, `stri_count_boundaries() `__, `stri_duplicated() `__, `stri_enc_detect2() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_collator() `__, `stri_order() `__, `stri_rank() `__, `stri_sort_key() `__, `stri_sort() `__, `stri_split_boundaries() `__, `stri_trans_tolower() `__, `stri_unique() `__ Other text_boundaries: `about_search_boundaries `__, `about_search `__, `stri_count_boundaries() `__, `stri_extract_all_boundaries() `__, `stri_locate_all_boundaries() `__, `stri_opts_brkiter() `__, `stri_split_boundaries() `__, `stri_split_lines() `__, `stri_trans_tolower() `__ diff --git a/docs/index.html b/docs/index.html index 688ec3cda..56df7130b 100644 --- a/docs/index.html +++ b/docs/index.html @@ -301,6 +301,7 @@

        stringi: THE String Processing Package for Rstri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
      • diff --git a/docs/news.html b/docs/news.html index 7b5df2542..3e3dad245 100644 --- a/docs/news.html +++ b/docs/news.html @@ -234,11 +234,15 @@

        1.6.1 (2021-XX-YY) develhttps://stringi.gagolewski.com/_static/vignette/stringi.pdf

      • …todo… #401 (update ICU4C to 69.1), The ICU4C bundle has been updated from version 61.1 to 69.1 which features Unicode 13.0 and CLDR 39.

      • -
      • …todo… #408 (stri_trans_casefold),

      • -
      • [INTERNAL] #414: Use LEVELS(x) macro instead of accessing -(x)->sxpinfo.gp directly (@lukaszdaniel).

      • +
      • [NEW FEATURE] #408: …todo… stri_trans_casefold(),

      • +
      • [NEW FEATURE] #421: stri_rank() ranks strings in a character +vector (e.g., for ordering data frames with regard to multiple +criteria, the ranks can be passed to order(), see #219).

      • +
      • [BUGFIX] stri_sort_key() now outputs bytes-encoded strings.

      • [BUGFIX] #415: locale='' was not equivalent to locale=NULL in stri_opts_collator().

      • +
      • [INTERNAL] #414: Use LEVELS(x) macro instead of accessing +(x)->sxpinfo.gp directly (@lukaszdaniel).

      diff --git a/docs/objects.inv b/docs/objects.inv index ec7322b13..75b0d3775 100644 Binary files a/docs/objects.inv and b/docs/objects.inv differ diff --git a/docs/rapi.html b/docs/rapi.html index 6c33557b5..e66b02496 100644 --- a/docs/rapi.html +++ b/docs/rapi.html @@ -167,6 +167,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -356,6 +357,7 @@

      R Package stringi Referencestri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/about_arguments.html b/docs/rapi/about_arguments.html index 137a863c2..99bfa14dd 100644 --- a/docs/rapi/about_arguments.html +++ b/docs/rapi/about_arguments.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/about_encoding.html b/docs/rapi/about_encoding.html index c954301ef..8d00c4d62 100644 --- a/docs/rapi/about_encoding.html +++ b/docs/rapi/about_encoding.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -326,7 +327,7 @@

      UTF-8 and UTF-16

      Character Encodings in R

      Data in memory are just bytes (small integer values) – an encoding is a way to represent characters with such numbers, it is a semantic ‘key’ to understand a given byte sequence. For example, in ISO-8859-2 (Central European), the value 177 represents Polish “a with ogonek”, and in ISO-8859-1 (Western European), the same value denotes the “plus-minus” sign. Thus, a character encoding is a translation scheme: we need to communicate with R somehow, relying on how it represents strings.

      -

      Basically, R has a very simple encoding marking mechanism, see stri_enc_mark. There is an implicit assumption that your platform’s default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU’s initialization and each time when you change it manually by calling stri_enc_set.

      +

      Overall, R has a very simple encoding marking mechanism; see stri_enc_mark. There is an implicit assumption that your platform’s default (native) encoding always extends ASCII – stringi checks that whenever your native encoding is being detected automatically on ICU’s initialization and each time you change it manually by calling stri_enc_set.

      Character strings in R (internally) can be declared to be in:

      @@ -332,7 +333,7 @@

      Facilities available

      stri_length (among others) for determining the number of code points in a string. See also stri_count_boundaries for counting the number of Unicode characters and stri_width for approximating the width of a string.

    • stri_trim (among others) for trimming characters from the beginning or/and end of a string, see also about_search_charclass, and stri_pad for padding strings so that they are of the same width. Additionally, stri_wrap wraps text into lines.

    • stri_trans_tolower (among others) for case mapping, i.e., conversion to lower, UPPER, or Title Case, stri_trans_nfc (among others) for Unicode normalization, stri_trans_char for translating individual code points, and stri_trans_general for other universal yet powerful text transforms, including transliteration.

    • -
    • stri_cmp, %s<%, stri_order, stri_sort, stri_unique, and stri_duplicated for collation-based, locale-aware operations, see also about_locale.

    • +
    • stri_cmp, %s<%, stri_order, stri_sort, stri_rank, stri_unique, and stri_duplicated for collation-based, locale-aware operations, see also about_locale.

    • stri_split_lines (among others) to split a string into text lines.

    • stri_escape_unicode (among others) for escaping some code points.

    • stri_rand_strings, stri_rand_shuffle, and stri_rand_lipsum for generating (pseudo)random strings.

    • @@ -342,7 +343,7 @@

      Facilities available

      Author(s)

      -

      Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM and others. The Unicode Character Database is due to Unicode, Inc.; see the COPYRIGHTS file for more details.

      +

      Marek Gagolewski, with contributions from Bartek Tartanus and many others. ICU4C was developed by IBM, Unicode, Inc., and others.

      References

      diff --git a/docs/rapi/operator_add.html b/docs/rapi/operator_add.html index 7b22ea77a..fe6b403a5 100644 --- a/docs/rapi/operator_add.html +++ b/docs/rapi/operator_add.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/operator_compare.html b/docs/rapi/operator_compare.html index 1529bec5f..ffeb58fa8 100644 --- a/docs/rapi/operator_compare.html +++ b/docs/rapi/operator_compare.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -363,7 +364,7 @@

      Value

      Examples

      diff --git a/docs/rapi/operator_dollar.html b/docs/rapi/operator_dollar.html index f649c5455..7c549dc0b 100644 --- a/docs/rapi/operator_dollar.html +++ b/docs/rapi/operator_dollar.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_compare.html b/docs/rapi/stri_compare.html index a6786bb6e..7e40bf7eb 100644 --- a/docs/rapi/stri_compare.html +++ b/docs/rapi/stri_compare.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -366,7 +367,7 @@

      References

      See Also

      -

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      +

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      Examples

      diff --git a/docs/rapi/stri_count.html b/docs/rapi/stri_count.html index 04088f1e6..e4173d497 100644 --- a/docs/rapi/stri_count.html +++ b/docs/rapi/stri_count.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_count_boundaries.html b/docs/rapi/stri_count_boundaries.html index 35da577a7..1e067cd88 100644 --- a/docs/rapi/stri_count_boundaries.html +++ b/docs/rapi/stri_count_boundaries.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -347,7 +348,7 @@

      Value
      diff --git a/docs/rapi/stri_datetime_add.html b/docs/rapi/stri_datetime_add.html index c02323227..c4bc03f83 100644 --- a/docs/rapi/stri_datetime_add.html +++ b/docs/rapi/stri_datetime_add.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_create.html b/docs/rapi/stri_datetime_create.html index eca18525b..ced2991b1 100644 --- a/docs/rapi/stri_datetime_create.html +++ b/docs/rapi/stri_datetime_create.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_fields.html b/docs/rapi/stri_datetime_fields.html index 47b59136d..28cd824dd 100644 --- a/docs/rapi/stri_datetime_fields.html +++ b/docs/rapi/stri_datetime_fields.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_format.html b/docs/rapi/stri_datetime_format.html index 464dffaab..d94cd8338 100644 --- a/docs/rapi/stri_datetime_format.html +++ b/docs/rapi/stri_datetime_format.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_fstr.html b/docs/rapi/stri_datetime_fstr.html index 9790c6fc6..e9cde107a 100644 --- a/docs/rapi/stri_datetime_fstr.html +++ b/docs/rapi/stri_datetime_fstr.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_now.html b/docs/rapi/stri_datetime_now.html index d7619955d..01cc34988 100644 --- a/docs/rapi/stri_datetime_now.html +++ b/docs/rapi/stri_datetime_now.html @@ -174,6 +174,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_datetime_symbols.html b/docs/rapi/stri_datetime_symbols.html index f48a836bd..35fba4bda 100644 --- a/docs/rapi/stri_datetime_symbols.html +++ b/docs/rapi/stri_datetime_symbols.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_detect.html b/docs/rapi/stri_detect.html index 4d7c4241d..acbd039cb 100644 --- a/docs/rapi/stri_detect.html +++ b/docs/rapi/stri_detect.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_dup.html b/docs/rapi/stri_dup.html index fa63ddf18..3e7617307 100644 --- a/docs/rapi/stri_dup.html +++ b/docs/rapi/stri_dup.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_duplicated.html b/docs/rapi/stri_duplicated.html index 21f5f58f5..3dd0db54a 100644 --- a/docs/rapi/stri_duplicated.html +++ b/docs/rapi/stri_duplicated.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -366,7 +367,7 @@

      References

      See Also

      -

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      +

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      Examples

      diff --git a/docs/rapi/stri_enc_detect.html b/docs/rapi/stri_enc_detect.html index bbcc68e67..62f6f0ec5 100644 --- a/docs/rapi/stri_enc_detect.html +++ b/docs/rapi/stri_enc_detect.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_detect2.html b/docs/rapi/stri_enc_detect2.html index 053083895..4a886fc84 100644 --- a/docs/rapi/stri_enc_detect2.html +++ b/docs/rapi/stri_enc_detect2.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -343,7 +344,7 @@

      Value

      diff --git a/docs/rapi/stri_enc_fromutf32.html b/docs/rapi/stri_enc_fromutf32.html index 097e69ad3..51b45ce4a 100644 --- a/docs/rapi/stri_enc_fromutf32.html +++ b/docs/rapi/stri_enc_fromutf32.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_info.html b/docs/rapi/stri_enc_info.html index ce5bf2e52..fce5a0ce0 100644 --- a/docs/rapi/stri_enc_info.html +++ b/docs/rapi/stri_enc_info.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_isascii.html b/docs/rapi/stri_enc_isascii.html index b09a58570..53ecfbc01 100644 --- a/docs/rapi/stri_enc_isascii.html +++ b/docs/rapi/stri_enc_isascii.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_isutf16.html b/docs/rapi/stri_enc_isutf16.html index 49cdc0163..2ac558345 100644 --- a/docs/rapi/stri_enc_isutf16.html +++ b/docs/rapi/stri_enc_isutf16.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_isutf8.html b/docs/rapi/stri_enc_isutf8.html index 4831b3919..e596cec78 100644 --- a/docs/rapi/stri_enc_isutf8.html +++ b/docs/rapi/stri_enc_isutf8.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_list.html b/docs/rapi/stri_enc_list.html index e09673e29..96013b309 100644 --- a/docs/rapi/stri_enc_list.html +++ b/docs/rapi/stri_enc_list.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_mark.html b/docs/rapi/stri_enc_mark.html index 1f55d8973..77c4c15d9 100644 --- a/docs/rapi/stri_enc_mark.html +++ b/docs/rapi/stri_enc_mark.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_set.html b/docs/rapi/stri_enc_set.html index 237e23ddd..bf5b266df 100644 --- a/docs/rapi/stri_enc_set.html +++ b/docs/rapi/stri_enc_set.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_toascii.html b/docs/rapi/stri_enc_toascii.html index bc4f73506..480ad9cbf 100644 --- a/docs/rapi/stri_enc_toascii.html +++ b/docs/rapi/stri_enc_toascii.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_tonative.html b/docs/rapi/stri_enc_tonative.html index 40aee40ff..66f569785 100644 --- a/docs/rapi/stri_enc_tonative.html +++ b/docs/rapi/stri_enc_tonative.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_toutf32.html b/docs/rapi/stri_enc_toutf32.html index 51f2b5146..1bcf418ba 100644 --- a/docs/rapi/stri_enc_toutf32.html +++ b/docs/rapi/stri_enc_toutf32.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_enc_toutf8.html b/docs/rapi/stri_enc_toutf8.html index 250391e9e..5cbf81b03 100644 --- a/docs/rapi/stri_enc_toutf8.html +++ b/docs/rapi/stri_enc_toutf8.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_encode.html b/docs/rapi/stri_encode.html index 577fbf20d..48d118afc 100644 --- a/docs/rapi/stri_encode.html +++ b/docs/rapi/stri_encode.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_escape_unicode.html b/docs/rapi/stri_escape_unicode.html index 1009e95bf..bf04ac1e9 100644 --- a/docs/rapi/stri_escape_unicode.html +++ b/docs/rapi/stri_escape_unicode.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_extract.html b/docs/rapi/stri_extract.html index 55386de46..f9e5b5528 100644 --- a/docs/rapi/stri_extract.html +++ b/docs/rapi/stri_extract.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_extract_boundaries.html b/docs/rapi/stri_extract_boundaries.html index 004c856fa..b31b065b3 100644 --- a/docs/rapi/stri_extract_boundaries.html +++ b/docs/rapi/stri_extract_boundaries.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -372,7 +373,7 @@

      Value
      diff --git a/docs/rapi/stri_flatten.html b/docs/rapi/stri_flatten.html index 1081d15aa..d27338776 100644 --- a/docs/rapi/stri_flatten.html +++ b/docs/rapi/stri_flatten.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_info.html b/docs/rapi/stri_info.html index e7ac1c13c..7fbaa0f58 100644 --- a/docs/rapi/stri_info.html +++ b/docs/rapi/stri_info.html @@ -173,6 +173,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_isempty.html b/docs/rapi/stri_isempty.html index 8a81aa562..e19285757 100644 --- a/docs/rapi/stri_isempty.html +++ b/docs/rapi/stri_isempty.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_join.html b/docs/rapi/stri_join.html index 4c54a1c40..0b6e14862 100644 --- a/docs/rapi/stri_join.html +++ b/docs/rapi/stri_join.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_join_list.html b/docs/rapi/stri_join_list.html index 241915e66..247ab31d2 100644 --- a/docs/rapi/stri_join_list.html +++ b/docs/rapi/stri_join_list.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_length.html b/docs/rapi/stri_length.html index 7d895ba7f..024276cda 100644 --- a/docs/rapi/stri_length.html +++ b/docs/rapi/stri_length.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_list2matrix.html b/docs/rapi/stri_list2matrix.html index 42ad87dc5..30decfca4 100644 --- a/docs/rapi/stri_list2matrix.html +++ b/docs/rapi/stri_list2matrix.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_locale_info.html b/docs/rapi/stri_locale_info.html index 3b7c1a431..efe29be22 100644 --- a/docs/rapi/stri_locale_info.html +++ b/docs/rapi/stri_locale_info.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_locale_list.html b/docs/rapi/stri_locale_list.html index d37a6385f..46dc9f2f3 100644 --- a/docs/rapi/stri_locale_list.html +++ b/docs/rapi/stri_locale_list.html @@ -174,6 +174,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_locale_set.html b/docs/rapi/stri_locale_set.html index dc839f488..20ffe2cbf 100644 --- a/docs/rapi/stri_locale_set.html +++ b/docs/rapi/stri_locale_set.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_locate.html b/docs/rapi/stri_locate.html index c14ae0c37..931e5e1e1 100644 --- a/docs/rapi/stri_locate.html +++ b/docs/rapi/stri_locate.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_locate_boundaries.html b/docs/rapi/stri_locate_boundaries.html index b11188328..220095c62 100644 --- a/docs/rapi/stri_locate_boundaries.html +++ b/docs/rapi/stri_locate_boundaries.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -363,7 +364,7 @@

      Value

      See Also

      Other search_locate: about_search, stri_locate_all()

      Other indexing: stri_locate_all(), stri_sub_all(), stri_sub()

      -

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      +

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_trans_tolower(), stri_wrap()

      diff --git a/docs/rapi/stri_match.html b/docs/rapi/stri_match.html index 3db8d43d5..d41dacd94 100644 --- a/docs/rapi/stri_match.html +++ b/docs/rapi/stri_match.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_na2empty.html b/docs/rapi/stri_na2empty.html index a34448b78..802599dc0 100644 --- a/docs/rapi/stri_na2empty.html +++ b/docs/rapi/stri_na2empty.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_numbytes.html b/docs/rapi/stri_numbytes.html index ceb98ac0c..48d6a0289 100644 --- a/docs/rapi/stri_numbytes.html +++ b/docs/rapi/stri_numbytes.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_opts_brkiter.html b/docs/rapi/stri_opts_brkiter.html index 2ea5d2b0b..8e4af294b 100644 --- a/docs/rapi/stri_opts_brkiter.html +++ b/docs/rapi/stri_opts_brkiter.html @@ -176,6 +176,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_opts_collator.html b/docs/rapi/stri_opts_collator.html index b1f83f1c5..c6dc0d66c 100644 --- a/docs/rapi/stri_opts_collator.html +++ b/docs/rapi/stri_opts_collator.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -389,7 +390,7 @@

      References

      See Also

      -

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      +

      Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique(), stri_wrap()

      Other search_coll: about_search_coll, about_search

      diff --git a/docs/rapi/stri_opts_fixed.html b/docs/rapi/stri_opts_fixed.html index bc3d4ceca..d1e63d7e8 100644 --- a/docs/rapi/stri_opts_fixed.html +++ b/docs/rapi/stri_opts_fixed.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_opts_regex.html b/docs/rapi/stri_opts_regex.html index 37264b316..ce99b5fce 100644 --- a/docs/rapi/stri_opts_regex.html +++ b/docs/rapi/stri_opts_regex.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_order.html b/docs/rapi/stri_order.html index 248de7ba5..f5e3b6250 100644 --- a/docs/rapi/stri_order.html +++ b/docs/rapi/stri_order.html @@ -177,6 +177,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • @@ -337,8 +338,9 @@

      Arguments

      Details

      For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

      -

      As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intuitive behavior of lexicographic sorting on numeric inputs.

      +

      As usual in stringi, non-character inputs are coerced to strings; see the example below for the somewhat non-intuitive behavior of lexicographic sorting on numeric inputs.

      This function uses a stable sort algorithm (STL’s stable_sort), which performs up to N*log^2(N) element comparisons, where N is the length of str.

      +

      For ordering with regard to multiple criteria (such as sorting data frames by more than one column), see stri_rank.

      Examples

      diff --git a/docs/rapi/stri_pad.html b/docs/rapi/stri_pad.html index 1b327f1b6..6073303d3 100644 --- a/docs/rapi/stri_pad.html +++ b/docs/rapi/stri_pad.html @@ -175,6 +175,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_rand_lipsum.html b/docs/rapi/stri_rand_lipsum.html index df5fce3c3..108dd0f1b 100644 --- a/docs/rapi/stri_rand_lipsum.html +++ b/docs/rapi/stri_rand_lipsum.html @@ -176,6 +176,7 @@
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
    • stri_remove_empty: Remove All Empty Strings from a Character Vector
    • diff --git a/docs/rapi/stri_rand_shuffle.html b/docs/rapi/stri_rand_shuffle.html index 66f813899..df65684da 100644 --- a/docs/rapi/stri_rand_shuffle.html +++ b/docs/rapi/stri_rand_shuffle.html @@ -176,6 +176,7 @@

  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • diff --git a/docs/rapi/stri_rand_strings.html b/docs/rapi/stri_rand_strings.html index 82e123588..69f4807ee 100644 --- a/docs/rapi/stri_rand_strings.html +++ b/docs/rapi/stri_rand_strings.html @@ -41,7 +41,7 @@ - + @@ -176,6 +176,7 @@
  • Examples
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
  • stri_read_raw: Read Text File as Raw
  • stri_remove_empty: Remove All Empty Strings from a Character Vector
  • @@ -283,7 +284,7 @@ diff --git a/docs/rapi/stri_rank.html b/docs/rapi/stri_rank.html new file mode 100644 index 000000000..33ad57ba0 --- /dev/null +++ b/docs/rapi/stri_rank.html @@ -0,0 +1,413 @@ + + + + + + + + + + stri_rank: Ranking — stringi 1.5.4 documentation + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
    + + + +
    + + + + + +
    + +
    + + + + + + + + + + + + + + + + + + + +
    + + + + + + +
    +
    +
    +
    + +
    +

    stri_rank: Ranking

    +
    +

    Description

    +

    This function ranks each string in a character vector according to a locale-dependent lexicographic order. It is a portable replacement for the base xtfrm function.

    +
    +
    +

    Usage

    +
    stri_rank(str, ..., opts_collator = NULL)
    +
    +
    +
    +
    +

    Arguments

    + ++++ + + + + + + + + + + + +

    str

    a character vector

    ...

    additional settings for opts_collator

    opts_collator

    a named list with ICU Collator’s options, see stri_opts_collator, NULL for default collation options

    +
    +
    +

    Details

    +

    Missing values result in missing ranks, and tied observations receive the same rank (based on min).

    +

    For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

    +
    +
    +

    Value

    +

    The result is a vector of ranks corresponding to each string in str.

    +
    +
    +

    References

    +

    Collation - ICU User Guide, http://userguide.icu-project.org/collation

    +
    + +
    +

    Examples

    +
    stri_rank(c('hladny', 'chladny'), locale='pl_PL')
    +stri_rank(c('hladny', 'chladny'), locale='sk_SK')
    +
    +stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10))  # lexicographic order
    +stri_rank("a" %s+% c(1, 100, 2, 101, 11, 10), numeric=TRUE)
    +
    +# Ordering a data frame with respect to two criteria:
    +X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8))
    +X[order(stri_rank(X$a), X$b), ]
    +
    +
    +
    +
    + + +
    + +
    + +
    +
    + +
    + +
    + + + + + + + + + + + \ No newline at end of file diff --git a/docs/rapi/stri_read_lines.html b/docs/rapi/stri_read_lines.html index f621c4185..0e94d653b 100644 --- a/docs/rapi/stri_read_lines.html +++ b/docs/rapi/stri_read_lines.html @@ -42,7 +42,7 @@ - + @@ -167,6 +167,7 @@
  • stri_rand_lipsum: A Lorem Ipsum Generator
  • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
  • stri_rand_strings: Generate Random Strings
  • +
  • stri_rank: Ranking
  • stri_read_lines: Read Text Lines from a Text File
    • Description
    • Usage
    • @@ -285,7 +286,7 @@ Next - Previous + Previous @@ -352,7 +353,7 @@

      See Also - +
      diff --git a/docs/rapi/stri_read_raw.html b/docs/rapi/stri_read_raw.html index 8e9d123de..200a616d7 100644 --- a/docs/rapi/stri_read_raw.html +++ b/docs/rapi/stri_read_raw.html @@ -167,6 +167,7 @@
    • stri_rand_lipsum: A Lorem Ipsum Generator
    • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
    • stri_rand_strings: Generate Random Strings
    • +
    • stri_rank: Ranking
    • stri_read_lines: Read Text Lines from a Text File
    • stri_read_raw: Read Text File as Raw
      • Description
      • diff --git a/docs/rapi/stri_remove_empty.html b/docs/rapi/stri_remove_empty.html index 1c6194a73..d678a2763 100644 --- a/docs/rapi/stri_remove_empty.html +++ b/docs/rapi/stri_remove_empty.html @@ -167,6 +167,7 @@
      • stri_rand_lipsum: A Lorem Ipsum Generator
      • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
      • stri_rand_strings: Generate Random Strings
      • +
      • stri_rank: Ranking
      • stri_read_lines: Read Text Lines from a Text File
      • stri_read_raw: Read Text File as Raw
      • stri_remove_empty: Remove All Empty Strings from a Character Vector
          diff --git a/docs/rapi/stri_replace.html b/docs/rapi/stri_replace.html index 8122059f5..f6a1f038e 100644 --- a/docs/rapi/stri_replace.html +++ b/docs/rapi/stri_replace.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_replace_na.html b/docs/rapi/stri_replace_na.html index 0e13617b8..cf5d00a98 100644 --- a/docs/rapi/stri_replace_na.html +++ b/docs/rapi/stri_replace_na.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_reverse.html b/docs/rapi/stri_reverse.html index d513674e2..8623eb78f 100644 --- a/docs/rapi/stri_reverse.html +++ b/docs/rapi/stri_reverse.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_sort.html b/docs/rapi/stri_sort.html index e4206baab..0ea743e6e 100644 --- a/docs/rapi/stri_sort.html +++ b/docs/rapi/stri_sort.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -300,7 +301,7 @@

          stri_sort: Sorting

          Description

          -

          This function sorts a character vector according to the locale-dependent lexicographic order.

          +

          This function sorts a character vector according to a locale-dependent lexicographic order.

          Usage

          @@ -337,7 +338,7 @@

          Arguments

          Details

          For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

          -

          As usual in stringi, non-character inputs are coerced to strings, see an example below for a perhaps non-intitive behavior of lexicographic sorting on numeric inputs.

          +

          As usual in stringi, non-character inputs are coerced to strings, see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs.

          This function uses a stable sort algorithm (STL’s stable_sort), which performs up to N*log^2(N) element comparisons, where N is the length of str.

          Examples

          diff --git a/docs/rapi/stri_sort_key.html b/docs/rapi/stri_sort_key.html index ea24498b3..c2ca1c21b 100644 --- a/docs/rapi/stri_sort_key.html +++ b/docs/rapi/stri_sort_key.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -300,7 +301,7 @@

          stri_sort_key: Sort Keys

          Description

          -

          This function computes a locale-dependent ‘sort key’, which is an alternative character representation of the string that, when ordered in the C locale (which orders using bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale with the ability to be locale-aware.

          +

          This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale (which orders using the underlying bytes directly), will give an equivalent ordering to the original string. It is useful for enhancing algorithms that sort only in the C locale (e.g., the strcmp function in libc) with the ability to be locale-aware.

          Usage

          @@ -331,10 +332,11 @@

          Arguments

          Details

          For more information on ICU’s Collator and how to tune it up in stringi, refer to stri_opts_collator.

          +

          See also stri_rank for ranking strings within a single character vector, i.e., generating relative sort keys.

          Value

          -

          The result is a character vector with the same length as str that contains the sort keys.

          +

          The result is a character vector with the same length as str that contains the sort keys. The output is marked as bytes-encoded.

          Examples

          diff --git a/docs/rapi/stri_split.html b/docs/rapi/stri_split.html index 30cbdcebd..9321fb959 100644 --- a/docs/rapi/stri_split.html +++ b/docs/rapi/stri_split.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_split_boundaries.html b/docs/rapi/stri_split_boundaries.html index 254659a0b..51da1d774 100644 --- a/docs/rapi/stri_split_boundaries.html +++ b/docs/rapi/stri_split_boundaries.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -358,7 +359,7 @@

          Value
          diff --git a/docs/rapi/stri_split_lines.html b/docs/rapi/stri_split_lines.html index 75ac36590..e68ce334d 100644 --- a/docs/rapi/stri_split_lines.html +++ b/docs/rapi/stri_split_lines.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_startsendswith.html b/docs/rapi/stri_startsendswith.html index 2e0ec7824..c74edbd3b 100644 --- a/docs/rapi/stri_startsendswith.html +++ b/docs/rapi/stri_startsendswith.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_stats_general.html b/docs/rapi/stri_stats_general.html index 95da6a66c..c8b566b69 100644 --- a/docs/rapi/stri_stats_general.html +++ b/docs/rapi/stri_stats_general.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_stats_latex.html b/docs/rapi/stri_stats_latex.html index 818f90eae..1decdff26 100644 --- a/docs/rapi/stri_stats_latex.html +++ b/docs/rapi/stri_stats_latex.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_sub.html b/docs/rapi/stri_sub.html index a54538613..d2525df81 100644 --- a/docs/rapi/stri_sub.html +++ b/docs/rapi/stri_sub.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_sub_all.html b/docs/rapi/stri_sub_all.html index 335c545d7..33c26525b 100644 --- a/docs/rapi/stri_sub_all.html +++ b/docs/rapi/stri_sub_all.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_subset.html b/docs/rapi/stri_subset.html index dbfc78f35..d367019e8 100644 --- a/docs/rapi/stri_subset.html +++ b/docs/rapi/stri_subset.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_timezone_info.html b/docs/rapi/stri_timezone_info.html index 94e6558e1..4a2e4a055 100644 --- a/docs/rapi/stri_timezone_info.html +++ b/docs/rapi/stri_timezone_info.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_timezone_list.html b/docs/rapi/stri_timezone_list.html index 873b4cd00..4172bf590 100644 --- a/docs/rapi/stri_timezone_list.html +++ b/docs/rapi/stri_timezone_list.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_timezone_set.html b/docs/rapi/stri_timezone_set.html index 7388286e4..178bcad31 100644 --- a/docs/rapi/stri_timezone_set.html +++ b/docs/rapi/stri_timezone_set.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_trans_casemap.html b/docs/rapi/stri_trans_casemap.html index c108a3f0c..b95b246d0 100644 --- a/docs/rapi/stri_trans_casemap.html +++ b/docs/rapi/stri_trans_casemap.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -357,7 +358,7 @@

          References

          See Also

          -

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_unique(), stri_wrap()

          +

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_unique(), stri_wrap()

          Other transform: stri_trans_char(), stri_trans_general(), stri_trans_list(), stri_trans_nfc()

          Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_wrap()

          diff --git a/docs/rapi/stri_trans_char.html b/docs/rapi/stri_trans_char.html index c3c1169c4..6e7abe467 100644 --- a/docs/rapi/stri_trans_char.html +++ b/docs/rapi/stri_trans_char.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_trans_general.html b/docs/rapi/stri_trans_general.html index 40dfcfc61..61316a009 100644 --- a/docs/rapi/stri_trans_general.html +++ b/docs/rapi/stri_trans_general.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_trans_list.html b/docs/rapi/stri_trans_list.html index ba0f342ad..5ebf9be1d 100644 --- a/docs/rapi/stri_trans_list.html +++ b/docs/rapi/stri_trans_list.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_trans_nf.html b/docs/rapi/stri_trans_nf.html index 016448178..ece7199f6 100644 --- a/docs/rapi/stri_trans_nf.html +++ b/docs/rapi/stri_trans_nf.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_trim.html b/docs/rapi/stri_trim.html index 9d7f20134..0720939d0 100644 --- a/docs/rapi/stri_trim.html +++ b/docs/rapi/stri_trim.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_unescape_unicode.html b/docs/rapi/stri_unescape_unicode.html index 9e0357bea..8e53e931b 100644 --- a/docs/rapi/stri_unescape_unicode.html +++ b/docs/rapi/stri_unescape_unicode.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_unique.html b/docs/rapi/stri_unique.html index 1f86b591b..ada34d95a 100644 --- a/docs/rapi/stri_unique.html +++ b/docs/rapi/stri_unique.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -343,7 +344,7 @@

          References

          See Also

          -

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_wrap()

          +

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_wrap()

          Examples

          diff --git a/docs/rapi/stri_width.html b/docs/rapi/stri_width.html index 0d10b47ac..c2288b965 100644 --- a/docs/rapi/stri_width.html +++ b/docs/rapi/stri_width.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/rapi/stri_wrap.html b/docs/rapi/stri_wrap.html index 44111465e..17318f94e 100644 --- a/docs/rapi/stri_wrap.html +++ b/docs/rapi/stri_wrap.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • @@ -388,7 +389,7 @@

          References

          See Also

          -

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique()

          +

          Other locale_sensitive: %s<%(), about_locale, about_search_boundaries, about_search_coll, stri_compare(), stri_count_boundaries(), stri_duplicated(), stri_enc_detect2(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_collator(), stri_order(), stri_rank(), stri_sort_key(), stri_sort(), stri_split_boundaries(), stri_trans_tolower(), stri_unique()

          Other text_boundaries: about_search_boundaries, about_search, stri_count_boundaries(), stri_extract_all_boundaries(), stri_locate_all_boundaries(), stri_opts_brkiter(), stri_split_boundaries(), stri_split_lines(), stri_trans_tolower()

          diff --git a/docs/rapi/stri_write_lines.html b/docs/rapi/stri_write_lines.html index 23ff4e7dc..1c9395ddc 100644 --- a/docs/rapi/stri_write_lines.html +++ b/docs/rapi/stri_write_lines.html @@ -167,6 +167,7 @@
        • stri_rand_lipsum: A Lorem Ipsum Generator
        • stri_rand_shuffle: Randomly Shuffle Code Points in Each String
        • stri_rand_strings: Generate Random Strings
        • +
        • stri_rank: Ranking
        • stri_read_lines: Read Text Lines from a Text File
        • stri_read_raw: Read Text File as Raw
        • stri_remove_empty: Remove All Empty Strings from a Character Vector
        • diff --git a/docs/searchindex.js b/docs/searchindex.js index ad8b44947..90b3eb05c 100644 --- a/docs/searchindex.js +++ b/docs/searchindex.js @@ -1 +1 @@ -Search.setIndex({docnames:["index","install","news","rapi","rapi/about_arguments","rapi/about_encoding","rapi/about_locale","rapi/about_search","rapi/about_search_boundaries","rapi/about_search_charclass","rapi/about_search_coll","rapi/about_search_fixed","rapi/about_search_regex","rapi/about_stringi","rapi/operator_add","rapi/operator_compare","rapi/operator_dollar","rapi/stri_compare","rapi/stri_count","rapi/stri_count_boundaries","rapi/stri_datetime_add","rapi/stri_datetime_create","rapi/stri_datetime_fields","rapi/stri_datetime_format","rapi/stri_datetime_fstr","rapi/stri_datetime_now","rapi/stri_datetime_symbols","rapi/stri_detect","rapi/stri_dup","rapi/stri_duplicated","rapi/stri_enc_detect","rapi/stri_enc_detect2","rapi/stri_enc_fromutf32","rapi/stri_enc_info","rapi/stri_enc_isascii","rapi/stri_enc_isutf16","rapi/stri_enc_isutf8","rapi/stri_enc_list","rapi/stri_enc_mark","rapi/stri_enc_set","rapi/stri_enc_toascii","rapi/stri_enc_tonative","rapi/stri_enc_toutf32","rapi/stri_enc_toutf8","rapi/stri_encode","rapi/stri_escape_unicode","rapi/stri_extract","rapi/stri_extract_boundaries","rapi/stri_flatten","rapi/stri_info","rapi/stri_isempty","rapi/stri_join","rapi/stri_join_list","rapi/stri_length","rapi/stri_list2matrix","rapi/stri_locale_info","rapi/stri_locale_list","rapi/stri_locale_set","rapi/stri_locate","rapi/stri_locate_boundaries","rapi/stri_match","rapi/stri_na2empty","rapi/stri_numbytes","rapi/stri_opts_brkiter","rapi/stri_opts_collator","rapi/stri_opts_fixed","rapi/stri_opts_regex","rapi/stri_order","rapi/stri_pad","rapi/stri_rand_lipsum","rapi/stri_rand_shuffle","rapi/stri_rand_strings","rapi/stri_read_lines","rapi/stri_read_raw","rapi/stri_remove_empty","rapi/stri_replace","rapi/stri_replace_na","rapi/stri_reverse","rapi/stri_sort","rapi/stri_sort_key","rapi/stri_split","rapi/stri_split_bou
ndaries","rapi/stri_split_lines","rapi/stri_startsendswith","rapi/stri_stats_general","rapi/stri_stats_latex","rapi/stri_sub","rapi/stri_sub_all","rapi/stri_subset","rapi/stri_timezone_info","rapi/stri_timezone_list","rapi/stri_timezone_set","rapi/stri_trans_casemap","rapi/stri_trans_char","rapi/stri_trans_general","rapi/stri_trans_list","rapi/stri_trans_nf","rapi/stri_trim","rapi/stri_unescape_unicode","rapi/stri_unique","rapi/stri_width","rapi/stri_wrap","rapi/stri_write_lines"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["index.rst","install.rst","news.rst","rapi.rst","rapi/about_arguments.rst","rapi/about_encoding.rst","rapi/about_locale.rst","rapi/about_search.rst","rapi/about_search_boundaries.rst","rapi/about_search_charclass.rst","rapi/about_search_coll.rst","rapi/about_search_fixed.rst","rapi/about_search_regex.rst","rapi/about_stringi.rst","rapi/operator_add.rst","rapi/operator_compare.rst","rapi/operator_dollar.rst","rapi/stri_compare.rst","rapi/stri_count.rst","rapi/stri_count_boundaries.rst","rapi/stri_datetime_add.rst","rapi/stri_datetime_create.rst","rapi/stri_datetime_fields.rst","rapi/stri_datetime_format.rst","rapi/stri_datetime_fstr.rst","rapi/stri_datetime_now.rst","rapi/stri_datetime_symbols.rst","rapi/stri_detect.rst","rapi/stri_dup.rst","rapi/stri_duplicated.rst","rapi/stri_enc_detect.rst","rapi/stri_enc_detect2.rst","rapi/stri_enc_fromutf32.rst","rapi/stri_enc_info.rst","rapi/stri_enc_isascii.rst","rapi/stri_enc_isutf16.rst","rapi/stri_enc_isutf8.rst","rapi/stri_enc_list.rst","rapi/stri_enc_mark.rst","rapi/stri_enc_set.rst","rapi/stri_enc_toascii.rst","rapi/stri_enc_tonative.rst","rapi/stri_enc_toutf32.rst","rapi/stri_enc_toutf8.rst","rapi/stri_encode.rst","rapi/stri_escape_unicode.rst","rapi/stri_extract
.rst","rapi/stri_extract_boundaries.rst","rapi/stri_flatten.rst","rapi/stri_info.rst","rapi/stri_isempty.rst","rapi/stri_join.rst","rapi/stri_join_list.rst","rapi/stri_length.rst","rapi/stri_list2matrix.rst","rapi/stri_locale_info.rst","rapi/stri_locale_list.rst","rapi/stri_locale_set.rst","rapi/stri_locate.rst","rapi/stri_locate_boundaries.rst","rapi/stri_match.rst","rapi/stri_na2empty.rst","rapi/stri_numbytes.rst","rapi/stri_opts_brkiter.rst","rapi/stri_opts_collator.rst","rapi/stri_opts_fixed.rst","rapi/stri_opts_regex.rst","rapi/stri_order.rst","rapi/stri_pad.rst","rapi/stri_rand_lipsum.rst","rapi/stri_rand_shuffle.rst","rapi/stri_rand_strings.rst","rapi/stri_read_lines.rst","rapi/stri_read_raw.rst","rapi/stri_remove_empty.rst","rapi/stri_replace.rst","rapi/stri_replace_na.rst","rapi/stri_reverse.rst","rapi/stri_sort.rst","rapi/stri_sort_key.rst","rapi/stri_split.rst","rapi/stri_split_boundaries.rst","rapi/stri_split_lines.rst","rapi/stri_startsendswith.rst","rapi/stri_stats_general.rst","rapi/stri_stats_latex.rst","rapi/stri_sub.rst","rapi/stri_sub_all.rst","rapi/stri_subset.rst","rapi/stri_timezone_info.rst","rapi/stri_timezone_list.rst","rapi/stri_timezone_set.rst","rapi/stri_trans_casemap.rst","rapi/stri_trans_char.rst","rapi/stri_trans_general.rst","rapi/stri_trans_list.rst","rapi/stri_trans_nf.rst","rapi/stri_trim.rst","rapi/stri_unescape_unicode.rst","rapi/stri_unique.rst","rapi/stri_width.rst","rapi/stri_wrap.rst","rapi/stri_write_lines.rst"],objects:{},objnames:{},objtypes:{},terms:{"0000":[5,9],"000a":66,"001a":44,"00ad":100,"0100":23,"0105":9,"0123456789":70,"032":40,"0377":12,"0530":23,"075258":23,"0800":23,"0ooo":12,"0x0a":82,"0x0b":82,"0x0c":82,"0x0d":82,"0x1a":40,"0x1f":98,"0x2028":82,"0x2029":82,"0x3000":100,"0x85":82,"0xff01":100,"0xff5e":100,"100":[2,64,67,78],"100000":30,"101":[67,78],"102":2,"105":2,"106":2,"10646":13,"107":2,"108":2,"109":2,"10ffff":[5,9],"110":2,"111":2,"1119":101,"112":2,"114":2,"116":2,"117":2,"118":2,"1184":101,"119":2,"
120":2,"122":2,"123":[2,14,18,27,47,50,51,52,53,62,75,77,81,88,92,93],"1234":75,"124":2,"1250":[30,36],"1251":30,"1252":[2,5,30],"1253":30,"1254":30,"1255":30,"1256":30,"126":2,"127":[5,34,38,40,43],"128":2,"129":2,"12l":21,"132":2,"133":2,"134":2,"135":2,"137":2,"138":2,"139":2,"141":2,"143":2,"144":2,"149":2,"154":2,"157":2,"164":2,"165":2,"168":2,"169":2,"16be":[30,31,35],"16le":[30,31,35],"170":2,"174":2,"175":2,"176":2,"177":5,"180":2,"183":2,"187":2,"188":2,"189":23,"190":69,"193":2,"1970":25,"1981":101,"199":2,"1990":9,"1996":23,"1999":[10,23],"1bc":[21,22],"1st":23,"1to1":33,"2001":2,"2002":12,"200b":100,"2013":0,"2014":[0,20],"2015":[0,21,23],"2016":[0,20],"2017":0,"2018":0,"2019":0,"2020":0,"2021":0,"2022":30,"2028":[9,82],"2029":[9,82],"205":2,"2060":9,"206f":9,"207":2,"210":2,"214":2,"216":2,"220":2,"227":2,"230":2,"231":2,"232":2,"235":23,"2350":23,"238":2,"242":2,"2451334":23,"253":2,"254":2,"258":2,"263":2,"266":2,"267":2,"270":2,"285":2,"288":2,"289":2,"296":2,"2bc":[21,22],"2nd":23,"314":2,"3166":[6,90],"317":2,"318":2,"319":2,"31t23":23,"325":2,"32be":[30,31,35],"32le":[30,31,35],"334":2,"335":2,"337":2,"338":2,"341":2,"343":2,"344":2,"345":2,"3456":[86,87],"347":2,"348":2,"355":2,"362":2,"3629":13,"363":2,"364":2,"366":2,"369":2,"370":2,"372":2,"382":2,"386":2,"393":2,"398":2,"399":2,"3rd":2,"400":2,"401":2,"405":2,"408":2,"414":2,"415":2,"456":[27,52,75,81],"4601":23,"5198":96,"55200":46,"5775":21,"61201235":23,"639":6,"667":[86,87],"789":[27,52,75,81,86,87],"822":23,"8601":23,"8859":[5,30],"8bit":33,"9899":9,"999":21,"abstract":12,"bart\u0142omiej":0,"break":[2,8,19,47,59,63,81,92,101],"byte":[0,2,3,5,7,12,13,30,31,32,33,34,35,36,38,40,41,42,43,44,53,66,79,86,98],"case":[0,1,2,3,4,5,6,7,8,9,10,11,12,13,17,19,24,27,30,31,43,44,46,47,51,53,55,59,63,64,65,66,70,75,80,81,87,94,96,101],"char":84,"class":[0,2,3,7,8,12,13,20,21,22,23,25,26,64,71,90,91,97],"default":[0,1,2,3,5,12,15,17,18,19,20,21,22,23,26,27,29,31,33,37,38,43,44,46,47,55,58,59,60,63,64
,65,66,67,68,72,75,78,79,80,81,82,83,88,89,90,92,97,99,101,102],"enum":[2,66],"export":2,"final":[5,6,9,12,100],"float":2,"function":[0,1,2,3,5,9,10,11,13,15,17,18,19,20,23,24,27,29,30,31,32,34,35,36,38,40,41,42,43,44,46,47,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,72,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,94,96,97,98,99,100,101,102],"import":[2,4],"long":[1,2,4,23,89,90],"new":[0,12,14,81,101],"null":[1,2,6,17,18,19,20,21,22,23,26,27,29,31,32,33,39,41,42,44,46,47,51,52,55,57,58,59,60,63,64,67,72,75,78,79,80,81,83,88,89,91,92,99,101,102],"public":9,"return":[2,5,7,12,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,68,69,70,71,72,73,74,75,76,77,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],"short":[1,2,9,11,23,49,89],"static":2,"strin\u0261i":0,"switch":[2,5],"throw":2,"true":[2,5,9,12,17,19,21,23,27,29,37,43,44,46,47,48,49,51,52,54,58,59,64,65,66,67,68,69,71,74,75,78,80,81,82,86,87,88,101],"try":[1,2,31],"var":1,"while":[2,5,6,8,17,39],Added:2,For:[0,1,3,4,5,6,8,9,10,12,17,19,23,24,30,32,36,37,43,44,45,46,47,53,58,59,60,62,63,66,67,75,78,79,81,83,86,87,89,91,92,94,97,98],Into:[0,3],Its:[12,36,86,87],Los:23,Mrs:[59,81],NAs:[0,3],NFs:96,Not:[30,46,57,62,75,86,91],One:6,Such:[5,29,86,87,99],Sys:[5,38,39],THE:[3,47,80],The:[0,1,2,5,6,7,8,9,10,11,12,13,17,19,20,23,25,27,30,31,34,36,37,41,48,54,58,59,60,62,63,67,69,72,75,78,79,80,81,88,90,96,98,100,101],Their:[6,12],There:5,These:[5,7,8,9,14,15,17,18,19,23,27,35,44,46,47,51,52,58,59,60,68,75,80,82,83,88,92,96,97],Use:[2,58,59],Used:89,Useful:2,Uses:98,Using:2,With:[12,55,92],_boundari:[2,7,59],_charclass:[2,7,9,83],_coll:[2,7,10,83],_count:2,_euro:6,_fix:[2,7,65,83],_limit:2,_regex:[2,7,12,58,60,75],_static:2,_word:[47,59],_xpg6:2,a_b_c__d:80,a_b_c_d:80,aaa:[23,46,58,97],aaaa:[46,58,75],aaaaaaaa:[46,58],aabbcc:[46,58],ab_c:80,aba:46,ababa:83,abababa:46,abaca:75,abbr
evi:[23,26],abc:[9,14,27,28,46,50,51,53,58,62,77,86,87,92],abcd:[60,68],abcdefghi:70,abcdefghijk:[46,58],abil:[72,79,102],abl:[2,7],about:[0,2],about_argu:[0,3,5,6,7,8,9,10,11,12,13],about_encod:[0,3,4,6,7,8,9,10,11,12,13,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44],about_local:[0,3,4,5,7,8,9,10,11,12,13,15,17,19,29,31,47,55,56,57,59,64,67,78,79,81,92,99,101],about_search:[0,3,4,5,6,8,9,10,11,12,13,18,19,27,46,47,58,59,60,63,64,65,66,75,80,81,82,83,88,92,97,101],about_search_boundari:[0,3,4,5,6,7,9,10,11,12,13,15,17,19,29,31,47,59,63,64,67,78,79,81,82,92,99,101],about_search_charclass:[0,3,4,5,6,7,8,10,11,12,13,97],about_search_col:[0,3,4,5,6,7,8,9,11,12,13,15,17,19,29,31,47,59,64,67,78,79,81,92,99,101],about_search_fix:[0,3,4,5,6,7,8,9,10,12,13,65],about_search_regex:[0,3,4,5,6,7,8,9,10,11,13,66],about_stringi:[0,3,4,5,6,7,8,9,10,11,12],abov:[9,31,54,60,64],absolut:1,ac_config_fil:2,ac_subst:2,acagagactttagatagagaaga:[58,60],accent:[9,10,11,94],accept:[2,63,88],access:[1,2,9,16,42],accompani:13,accord:[9,38,44,46,62,64,78,80,92],accordingli:2,account:[8,10,17,30,65,68,89,101],acd:9,acgt:[60,93],achiev:94,across:2,act:[2,14,35,63,68,101],action:63,activ:[5,9,62,96],actual:[11,101],add:[2,20,44,68],added:[2,68],adding:20,addit:[1,2,17,18,19,23,27,29,46,47,58,59,60,67,75,78,79,80,81,83,88,90,92,99],addition:[2,5,13,17,37,38,60],address:2,adipis:[18,75,84,85,86,101],adjac:23,adjust:97,advanc:[4,9,12,63],aesthet:101,affect:[2,80,81,94],after:[2,12,30,64],aga:[46,58,75],agaga:[46,58,75],again:[2,9],against:[1,2,30],aggreg:[84,85],agonek:77,ahead:12,aim:[2,9,19,44,72],ala:[65,66],algorithm:[2,9,10,11,13,67,78,79,85,96,101],alia:[2,17,29,44,54,64,66,69,72,73,74,75,86,87,101,102],alias:[2,9,37,51,52],align:[0,3],alik:64,aliquet:[84,101],all:[0,1,2,3,4,5,6,7,9,10,12,13,15,17,18,19,22,23,26,27,28,29,30,31,33,34,36,38,40,43,44,45,46,47,52,56,57,58,59,60,61,64,75,80,81,90,91,96,97,101,102],alloc:2,allow:[2,5,9,10,12,17,18,21,27,32,46,58,60,66,86,101],almost:[4,5,90],alon:23,al
ong:30,alpha:27,alphabet:[9,12],alphanumer:5,alreadi:[1,29,91],also:[0,1,2,68,77],alter:12,altern:[2,9,12,58,79,86],alternate_shift:64,alwai:[5,9,17,31,39,40,44,51,54,56,57,71,72,88,90,96,101],ambigu:5,america:23,amet:[18,52,69,75,80,84,85,86,101],among:[0,2,5,9,13,60,68],amount:[5,20,30,90],ampm:[22,26],analog:94,analysi:[0,2,3,7,12,13,19,47,59,63,81,101],angel:23,angl:[12,30],ani:[0,2,4,5,6,9,12,13,17,23,29,32,43,45,51,55,63,64,65,66,75,82,86,87,89,94,96,100],annex:[9,96,100],anno:23,anoth:[9,94],anydupl:29,anymor:2,anyth:[55,86],anywai:[1,2],apart:[5,37],api:[0,2,9,13,24,26,32,38,63,64,66,90,91],apidoc:[9,13,26,63,64,66,90,91],appear:[5,6,12,23,63,71,80,82,84,85],append:23,appli:[4,9,12,14,80,82,87,90,100,101],applic:[2,5,86,87],appreci:0,appropri:[1,8,44,46,64,80],approxim:[2,13,100],arab:30,arbitrari:[32,83,97],architectur:64,archiv:1,area:90,arg:[1,2],argument:[0,1,2,3,5,6,13],aris:96,arithmet:[0,3],arrai:2,arrang:101,asan:2,ascend:67,ascii:[0,2,3,5,9,12,23,31,33,36,38,39,43,44,45,66,71,94,98,100,101],ascii_hex_digit:9,asian:100,ask:6,assert:12,assum:[1,2,4,5,38,39,40,43,44,96],assumpt:[5,38,40],asymmetr:9,atom:[2,4,12,16,51,54],atomic_vector:16,attempt:2,attr:22,attrib:2,attribut:[2,37,64,99],augu:[84,85,101],australian:6,author:0,auto:2,autoconf:2,autom:5,automat:[5,6,9,38,44,96],avail:[0,2,3,6,7,9,12,37,46,65,66,75,89,94],avoid:[2,6,9,96],awar:[6,11,12,13,27,64,79],baaab:18,baab:18,bab:18,babaab:93,babab:18,back:[6,9,12,23,86],backslash:[9,66,75],backtrack:66,backward:[2,64],bacon:[19,52,59,60,81],bartek:13,bartolini:[46,58],base:[1,2,5,7,9,10,13,15,16,21,22,24,29,31,59,64,69,83,86,87,94,99,100,101],basic:[2,5,8,23,33,54,55,89],bastienfr:2,bbbbb:58,bear:75,becam:2,becaus:[1,2,4,6,11,14,30,31,36,44,65,72,96],becom:[1,23,80,102],been:[0,1,2,5,9,30,53,63,83,91],befor:[2,9,12,30,45,64,89,101],begin:[12,13,67,78,85,90],behavior:[4,6,8,12,43,51,63,64,65,66,67,78,90],behaviour:2,behind:[2,12],being:[2,5,12,23,55,64,86,101],bell:12,belong:9,below:[2,4,5,8,9,12,17,2
3,33,46,58,64,67,75,78,84],best:[5,6,30,31],better:[5,12,29,65,70,99],between:[0,2,3,5,9,10,12,17,24,48,59,64,80,97,101],bewar:98,biarch:2,bibliograph:9,bidi:9,bidi_control:9,bidi_mirror:9,bidirect:[9,70,71,77,86],big5:30,big:[1,2,71],bin:[1,2],binari:[0,2,3,7,14,18,72,73,84,97,102],bit:[5,31,32,33,36,39,40,42,43,62,90],bitcoin:97,bitwis:11,black:75,bogu:43,bom:[2,5,17,43,44],both:[2,5,17,19,20,35,43,68,74,86,97,101],bound:[9,86],boundari:[0,2,3,7,12,13,63,66,80,92,101],boundaryanalysi:[8,63],box:[1,2],bracket:[9,12,30],breakfast:60,breakiter:[0,2,3,8,19,47,59,81,92,101],briefli:9,bring:2,british:2,broader:94,broken:2,brown:[59,75,81],bsd:[0,2,13],buddhist:26,buffer:2,bug:[0,1,2],bugfix:2,build:[0,2],built:[1,2,49,51,54,94],bundl:[1,2],by_row:54,byrow:[2,46,47,54,80,81],bytewis:[29,64,99],c90:9,calendar:[2,6,20,21,22,23,26,89],call:[0,1,2,4,5,6,11,14,15,17,18,19,27,30,41,42,43,44,46,47,48,55,57,58,59,60,72,75,80,81,83,87,88,90,94,101],cam:100,can:[0,1,2,5,8,9,30,32,38,41,43,44,70,73,87,92,94,97,101],canadian:64,cannot:[2,8,44,72,98],canon:[2,10,15,17,29,33,37,96,99],capabl:94,capit:[8,92],captur:[0,2,3,12,46,75],care:[4,86],carefulli:5,carriag:[12,82],cascad:5,case_ignor:9,case_insensit:[2,27,46,58,65,66,75],case_level:[17,64],case_map:65,case_sensit:9,casemap:92,cat:[1,5,68,69,100,101],categori:[5,7,12,18,38,39,63,97,100],caus:[2,9,43,64],cbind:[86,87],ccc:23,cccc:23,ccccc:23,cccccc:23,center:[0,3],cento:[1,2],central:5,certain:[23,45],certainli:36,cflag:1,cg_miss:[2,60],chain:[2,69,94],chang:[2,5,6,9,12,30,39,42,57,66,68,86,90,91,92,101],changes_when_casefold:9,changes_when_casemap:9,changes_when_lowercas:9,changes_when_nfkc_casefold:9,changes_when_titlecas:9,changes_when_uppercas:9,charact:[0,2,3,4,6,7,8,13,15,16,17,18,19,23,24,27,28,29,32,34,35,36,38,40,41,42,43,44,45,46,47,48,49,50,52,53,55,56,58,59,60,61,62,63,67,68,69,70,71,72,75,77,78,79,80,81,82,83,87,88,90,92,94,95,96,98,99,100,101,102],character_set:30,charclass:[2,9,18,27,46,58,71,75,80,83,84,88,97,100],
charmod:96,charscmdenvir:85,charset:[39,49],charsiz:33,charsnwhit:84,charswhit:85,charsword:85,charsxp:2,chartr:2,check:[0,1,2,3,5,6,9,17,30,31,38,46,64,68,83],chines:[8,9,23,30],chladni:[17,67,78,79],choic:[5,23],choos:1,chunk:7,circul:6,circumst:24,citi:23,civil:6,cjkv:9,clang:2,clariti:9,classicu_1_1col:64,classicu_1_1dateformatsymbol:26,classicu_1_1timezon:[90,91],classicu_1_1unicodeset:9,classif:9,classifi:35,claus:[0,2,13],cldr:2,clean:2,clever:[17,44],clock:[22,23],close:[1,9],closer:90,cluster:12,cmd:[1,85],code:[0,2,3,5,6,8,9,12,13,15,17,19,31,32,33,40,42,43,44,59,62,64,65,68,71,77,83,84,86,90,92,93,99,101],codec:2,codepoint:96,coerc:[2,37,48,54,67,78],coercibl:[4,14,15,17,19,20,22,23,32,38,42,47,50,51,53,59,62,76,81,100],coercion:2,coexist:5,coll:[18,27,46,58,64,65,75,80,83,88],collaps:[2,4,30,48,51,52,69,70],collat:[0,2,3,6,7,10,13,29,67,78,79,99],collect:2,colour:1,column:[2,22,54,58,59,60,86,87,100],com:[1,2,13],combin:[9,12,55,94,96],come:[8,92],command:[0,1,3],comment:[12,66],common:[1,2,40,89],commonli:[9,30],commun:[5,6],compar:[0,3,5,6,12,13,29,60,62,75],comparison:[2,5,6,15,17,64,67,78],compat:[2,23,96,100,101],competit:5,compil:[1,2],complement:9,complex:[1,5,10,11,64,93,101],complic:55,compon:[13,26,31,33,49,89],composit:[94,96],compound:94,comprehens:[2,9],comput:[5,6,22,62,79],con:[2,72,73,102],concaten:[0,2,3,5,13,28],concept:6,concern:90,concis:49,conclus:0,condition:2,confid:[30,31],config:[1,2],configur:[1,2,30,86],conform:[2,12,72],confus:51,conjoin:[10,11],conjunct:2,connect:[2,9,54,72,73,102],connector_punctu:12,consectetur:[18,75,84,85,86,101],consecut:[27,46,58,75,101],consequ:[15,39],consid:[44,64],consider:5,consist:[0,2,4,5,9,13,17,24,40,47,52,60,68,69,71,92,93],consol:[5,53,68,101],conson:100,consortium:13,constant:[2,12,66],construct:[2,21],contain:[0,3,9,49,63,66,75,79,84,101],content:[13,82,96],context:[12,23,26,65,85,92],continu:9,contrari:[97,101],contribut:[0,13],contributor:85,control:[2,8,9,12,64,66,67,78,83,98,100],conven
i:[0,2,13,18,27,32,46,57,58,60,63,64,65,66,68,75,76,80,83,88,94,97],convent:[6,19,45,47,59,92,101],convers:[2,11,13,24,30,44,73,94],convert:[0,2,3,4,5,9,23,31,37,45,94,96],converted_str:44,cooki:92,coordin:90,copi:[1,2,4,86,87,99],coptic:26,copyright:[2,13],correct:[0,2,6,10,11,13,86],correctli:[1,2,5,39],correspond:[2,4,9,15,17,27,32,34,36,42,51,53,60,75,82,86,87,90,93],cost:[2,101],cost_expon:101,could:[2,6,30],count:[0,2,3,7,8,13,23,83,85,86],counterpart:[29,99],countri:[6,55,90],cours:[2,4,30,31,83],cover:[5,12,31],cpp:[2,31],cppflag:1,cpu:66,cra:[84,101],cran:0,creat:[0,1,3,5,14,56],crlf:82,csrucod:31,cstring:2,cultur:6,currenc:[6,9],current:[0,1,2,3,6,9,12,22,23,39,41,44,49,57,60,62,69,72,89,91,102],custom:[1,2,63],customis:0,cxx11:[1,2],cxx1x:2,cxxcpp:2,cxxflag:1,cyclic:23,cyril:[9,94],czech:30,czw:23,d_ef_g:80,dai:[20,21,22,23],danish:30,dash:[2,9],dat:2,data:[0,1,2,3,5,9,11,22,23,30,31,38,44,59,62,64,69,80,90,102],databas:[9,13],date:[0,2,3,13,24,90,91],date_long:23,dateformatsymbol:26,datetim:[20,21,22,23,24,25,26,89,90,91],datetime_relative_medium:23,davisvaughan:2,daylight:[23,89,90],dayofweek:22,dayofyear:22,de_d:[17,92],deal:[2,4,5,42,53],debian:1,debug:2,decid:5,decim:[9,12],decimal_numb:12,declar:[0,2,3,5,39,40,41,43,44],decnumb:2,decod:[32,94],decomposit:96,decreas:[30,31,67,78],def:27,default_ignorable_code_point:9,default_local:2,defin:[9,10,12,32,39,49,64,80,82,83,86,87,90,96,98],definit:[64,66],delimit:80,deliv:6,denorm:5,denot:[5,9,22,48,75,83,86,101],depend:[1,2,5,6,8,9,12,15,17,18,22,23,27,29,46,57,58,66,67,75,78,79,80,82,83,88,91,92,99,101],deprec:[0,2,3,9,29,63,64,65,66,69,72,73,102],descend:67,describ:[9,10,11,12,54],design:[2,5,23,90,94],desir:[6,66,71,76,94],dessert:60,detail:4,detect:[0,2,3,6,7,13,35,38,39,42,53,60,65,73,84],determin:[0,2,3,5,9,13,17,19,27,30,40,80,82,91,96,101],dev:[1,2,9,13,26,63,64,66,90,91],devel:[0,1],develop:[1,5,13],diacrit:[8,9,17],diagnos:44,diagnost:2,did:[2,6],differ:[2,5,6,8,9,12,17,18,19,30,46,48,51,58,60,6
6,75,92,93,94,96,97],digit:[5,9,12,13,23,45,64,71,90,98],digraph:9,dim:4,dimitri:2,dir:[1,2],directli:[2,58,79,83],directori:1,disabl:[1,2,12],disallow:[9,44],disappear:9,discourag:9,discret:69,discuss:[5,39,44,55],disjoint:87,dispatch:68,displai:[2,5,8,9,23,69],display_typ:89,distinguish:12,distribut:[1,2,13,69],divers:1,doc:[9,10,13,26,63,64,66,90,91],document:[2,8,9,13,26,63,64,66,90,91,96],doe:[1,2,5,6,8,9,12,17,23,24,33,55,60,64,90,100,101],dog:75,doing:[4,5,39],dolor:[18,52,69,75,80,84,85,86,101],domini:23,done:[11,71],dot:9,dot_al:66,dotal:66,download:[0,1,2],draft:[0,2,13,96],drastic:2,draw:71,drop:4,dst:[89,90],dt_relative_styl:23,dt_style:23,du_disable_renam:2,dual:[32,42],due:[1,4,5,13,37],dummi:[2,69],duplic:[0,2,3,37,99],dure:[6,56,80,90],dutch:30,dynam:[2,101],dynlib:2,e0000:9,e0fff:9,each:[0,2,3,4,5,6,7,8,9,13,14,18,24,27,28,29,30,31,32,37,40,42,46,47,51,52,53,54,58,60,62,68,71,72,75,76,80,82,83,84,85,86,87,92,93,94,95,96,101,102],eagerli:2,earli:2,eas:2,easier:[5,88],easili:[2,42,102],east:100,eee:23,eeee:23,eeeee:23,eeeeee:23,effect:[39,57,90],effici:[2,4,10,12,43],efficient_text_searching_in_java:10,egg:[19,59,60,81],eight:12,either:[1,5,9,12,18,23,24,27,44,45,46,63,80,83,88,90,92],element:[0,2,3,4,6,13,15,17,18,27,30,31,34,36,37,42,46,47,48,50,51,53,54,58,60,67,71,75,78,80,82,83,84,85,87,102],elit:[18,75,84,85,86,101],ellipsi:36,embed:44,emoji:[2,9,46],emoji_modifi:9,emoji_modifier_bas:9,emoji_present:9,emploi:9,empti:[0,2,3,4,6,9,12,18,27,31,46,47,48,50,51,80,81,82,83,86],emul:2,en_au:6,en_u:[6,57,59,81,92],enabl:[12,30,65,66],enc2utf8:[42,43],enc:[33,39],enclos:[9,23],encod:[0,2,3,9,13,30,32,34,35,36,40,42,43,49,53,62,72,73,88,96,102],encoding_convers:[5,32,40,41,42,43,44],encoding_detect:[5,30,31,34,35,36],encoding_manag:[5,33,37,38,39],encodingnam:44,encount:[5,12,39],encourag:[1,100],end:[0,2,3,7,8,9,12,13,27,30,32,46,57,58,59,62,63,66,67,75,78,82,85,86,87,90,91,97,101],endian:[1,2],engin:[0,2,3,7,9,11,12,13,18,27,30,46,58,60,75,80,83,88],eng
lish:[6,10,30],enhanc:79,entir:66,entireti:72,entri:[0,37,66],enumer:100,envir:85,environ:[1,2,41,85],equal:[17,23,29,30,31,51,52,64,68,71,80,81,99,100],equat:90,equip:2,equival:[2,5,9,10,15,16,17,19,29,38,42,48,51,59,64,65,66,75,76,79,82,88,96,99,100],era:[22,23,26],erron:44,error:[2,4,9,12,33,53,66,84,101],error_on_unknown_escap:66,escap:[0,3,12,13,23,66,75],especi:[1,5,10,30,86],essenti:96,establish:[2,4,57,64,91],eszett:92,etc:[1,2,4,5,12,21,22,26,42,46,63,80],etiam:[84,101],euc:30,euro:[2,6],europ:[89,91],european:[5,6],evalu:12,even:[5,8,12,23,30,54,55],evenli:101,ever:5,everi:[13,60,75,77,101],everyth:9,exact:[2,12],exactli:[5,12,17,32,33,38,42,68],examin:[5,27],exampl:[0,2,5,6,8,9,11,12],examplercppstringi:2,exce:[44,72],except:[2,9,12,23,101],exclud:[63,88],exclus:[86,87],exdent:[2,101],execut:[1,45],exemplar:23,exemplari:23,exercis:69,exist:[1,2,5,12],expand:2,expect:[1,4,6,9,66],experi:[1,101],expert:39,explain:[4,5,6,7],explicit:5,explicitli:[44,86],expon:101,express:[0,3,4,5,7,9,13,66,82,97],extend:[5,9,23,36,38,40,43],extens:2,extern:[2,5],extra:[1,64,93],extract:[0,2,3,7,12,13,29,58,80,81],face:1,facil:[10,11,30,31,66,98],fact:[30,37],factor:4,fail:[1,2,5,6,12,30,31,39,41,43,62,66],failur:[2,12,30,31],fall:[9,23],fallback:1,fallback_encod:[2,72],fals:[2,5,21,23,27,29,30,35,36,37,43,44,46,47,48,49,51,54,58,59,60,63,64,65,67,68,69,74,75,78,80,81,82,83,86,87,88,101],famili:[2,31,37,63],familiar:2,fanci:[13,48],faq:5,fashion:[2,17],fast:[0,2,11,12,13],faster:[9,44,83,88],fastest:50,fcd:64,featur:[0,1,2,12,19,59,68,81,101],feature_test:2,februari:20,fedora:1,feed:[12,82],feel:[14,15,17,83],fetch:[1,89,90],few:[0,1,12,30,31],fewer:12,fff0:9,fffb:9,fffd:44,field:[0,2,3,23,80],file:[0,1,2,3,5,13,30,63,82,84,85],fill:[2,46,47,54,80,81],filter:[30,81],filter_angle_bracket:30,find:[1,4,8,9,50,58,67],first:[1,2,4,7,8,9,10,12,17,22,23,29,31,33,46,48,51,52,58,59,60,75,83,90,92,94,97,101],fit:[5,8,63],fix:[0,2,3,10,12,18,27,43,46,49,58,62,66,75,80,83,88],flag:[1,2,1
2,23,49,66],flatten:[0,3],flavor:[1,9],flavour:2,floor:[68,101],fname:[2,72,73,102],fold:[2,13,96],follow:[1,2,5,6,7,9,12,13,19,22,26,29,30,31,33,45,47,49,55,59,63,69,82,84,85,89,92,94,96,98,100,101],font:100,food:60,forc:[1,2,64],form:[5,6,9,12,16,23,24,36,40,42,49,55,57,60,64,75,82,86,96,98],formal:[96,100],format:[0,2,3,8,9,12,13,30,90,96],formatpars:[23,26],formatt:24,found:[29,40,44,46,58],four:5,fox:75,fraction:[21,23],fragment:12,frame:[2,22,30,31,90],free:12,freeli:9,french:[6,30,64],frequent:[2,30],friedl:12,friend:15,friendli:[2,5,33,39,86,87],from:[0,1,2,3,4,5,9,12,13,17,21,23,29,30,37,43,44,46,51,58,66,67,69,71,75,78,80,82,83,87,88,90,94,96],from_last:[2,29],fromlast:[2,29],front:86,full:[2,23,65,80,81,92,94,100],fulli:[0,31,60],fundament:6,further:[5,13],futur:[2,23,63,64,65,66,84,85],gaertner:17,gagolew:[1,2],gagolewski:[0,2,13],gain:2,garbag:2,gather:13,gb18030:30,gcing:2,gcmask:2,gcuacggagcuucggagcuag:93,gener:[0,1,2,3,4,7,8,12,13,18,23,27,32,39,40,42,44,46,53,61,70,83,86,87,92,95,96,97,100],general_categori:9,generic_loc:89,generic_long:89,generic_short:89,german:[6,30,92],get:[0,1,2,3,4,5,6,33,45,51,52,53,55,58,59,64,74,84,94,97,101],getlocal:[5,38,39],getopt:[68,101],ggg:23,gggg:23,ggggg:23,ghi:27,github:[0,1,2,9,13,26,63,64,66,90,91],give:[0,2,5,11,12,13,23,29,37,38,49,57,58,59,60,67,68,70,71,76,77,79,80,81,83,84,85,86,87,93,101],given:[0,2,3,4,5,7,12,17,18,23,24,27,32,33,35,36,37,38,39,46,47,49,52,53,54,58,60,66,67,68,69,75,76,80,81,82,83,86,90,93,94,97,98,101,102],glanc:[9,10],glibc:2,gmt:[23,89,90],gmt_long:89,gmt_short:89,good:[12,46],graphem:[5,12],great:4,greater:[5,17,36,38,40,51,52,62,71,101],greatest:31,greatli:0,greedi:[2,101],greek:[9,30,94],greenwich:90,gregorian:[2,20,21,22,23,26,89],gro:[29,94,99],gross:[29,99],group:[0,2,3,5,6,12,30,46,75],gru:23,grudnia:23,guarante:[1,2],guess:[30,31],guid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94,95,96,99],guidelin:[23,72,82],had:[2,5],hadlei:0,half:90,halfwidth:94,hand:[8
0,81],handl:[2,5,6,8,30,38,50,53,62,76,86,94,98],hangul:100,happi:[59,81],hard:63,has:[0,1,2,5,30,38,39,43,48,51,52,53,83,86,91],have:[1,2,5,6,8,9,12,23,29,31,33,39,44,54,63,68,100,101],hbox:2,he_il:26,heap:66,hebrew:[20,21,22,26,30],help:1,hemispher:90,henc:[29,99],here:[9,10,11,12,17,23,30,38,41,43,53,58,60,92],hesit:1,heurist:[30,31],hex:[12,45,94,98],hex_digit:9,hexadecim:9,hhhh:12,hhhhhhhh:12,higher:[30,31],hiragana:63,histor:90,hit:31,hladn:17,hladni:[17,67,78,79],hms:23,hold:[17,38],home:[2,13],homepag:[0,13],honour:2,hopefulli:1,horizont:[12,101],host:0,hour12:22,hour:[20,21,22,23,89,90],how:[2,4,5,6,7,9,10,12,13,17,55,67,78,79],howev:[1,2,5,6,9,14,30,35,36,44,54,55,62,75,94],html:[5,6,9,10,12,13,26,30,63,64,66,82,90,91],http:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,85,90,91,92,94,95,96,99,100],human:[6,89],hundr:[5,30,31],hungarian:30,hyphen:[9,100],i18n:[2,13,31],iana:33,ibm420:30,ibm424:30,ibm:[13,33],icecream:60,iconv:44,icu4c:[0,2,9,13,26,63,64,66,90,91],icu52dt:2,icu55:[1,2],icu61:2,icu:[0,1,2,5,6,7,8,9,10,13,17,19,20,23,24,26,29,30,31,33,37,38,39,44,46,47,49,55,56,59,60,63,64,65,66,67,75,78,79,81,89,90,91,92,94,95,96,98,99,101],icudt52b:2,icudt61b:2,icudt61l:2,icudt:[1,2],icudt_dir:1,id456:88,id_:14,id_continu:9,id_start:9,ident:90,identifi:[0,2,3,9,19,20,21,22,23,26,31,33,37,47,55,56,59,89,91,92,94,95,101],ideograph:[9,63],iec:9,ietf:[13,96],ifels:102,iff:31,ignor:[2,5,6,9,10,11,12,17,19,23,25,30,44,47,51,52,59,64,71,80,86,90,93,96],ignore_nul:[2,51],ill:[32,40,42,98],imag:30,imbal:2,implement:[2,6,10,11,12,44,69,72,83,85,92],impli:36,implicit:[5,9,38],imprecis:[5,30,31],improp:6,improv:2,inc:13,incident:5,includ:[0,1,2,3,6,7,8,9,12,13,18,26,27,46,58,60,62,75,80,83,85,86,88,100],inclus:[9,86],incompat:2,inconsist:24,incorrect:[2,43,44,53],incorrectli:2,increas:78,increment:64,inde:36,indent:[2,101],independ:[2,7,13,15,17,34,35,36,75],index:[2,29,58,59,83,86,87],indian:26,indic:[2,7,15,17,29,31,34,36,44,46,47,49,58,59,60,81,8
6,87,99],individu:[2,6,13,42,46,80],influenti:1,info:[12,90],inform:[2,5,6,10,12,13,17,19,33,37,47,49,55,56,57,59,67,78,79,81,89,90,91],initi:[2,5,6,9,31,101],inject:86,input:[2,5,11,12,17,30,32,38,40,44,45,51,59,63,64,66,67,72,75,78,80,82,86,87,92,93,94,96,101],ins:72,insensit:[0,3,5,9,12,17,65,66],insert:2,insid:[12,23,66],insight:55,inspect:27,inspir:[0,12,31],instal:[0,2],instanc:[4,5,18,23,27,36,37,46,58,60,83,86,97],instead:[2,62,68,101],instruct:2,integ:[4,5,17,18,19,20,21,27,28,29,32,42,53,54,58,59,62,64,66,67,68,69,71,80,81,83,84,85,86,87,100,101],intellig:2,intens:2,interact:6,interchang:[90,96],interest:[4,13,27,83,88],interestingli:10,interfer:30,intern:[2,5,13,30,32,39,44,49,62,91],internation:13,internet:1,interoper:[5,96],interpret:[5,23,40,43],intersect:9,intit:78,introduc:[2,96],introduct:[0,12],inttoutf8:32,intuit:[5,38,67],invalid:[2,43],invis:[39,57,91],ipa:0,ipsum:[0,2,3,18,52,75,80,84,85,86,101],is_unknown_8bit:[5,43],isalnum:9,ish:2,islam:[6,26],ismwx:12,iso8601:23,iso:[5,6,9,13,23,30,90],ispunct:9,issu:[1,2,4,13,42,44],italian:30,iter:[2,4,8,9,19,47,59,63,81,92,101],its:[2,4,5,6,9,12,13,15,17,29,37,86,99],itself:[40,90],ja_jp_tradit:26,jamo:100,januari:[20,22],japanes:[8,9,26,30,94],java:[0,10,12,13,33],jdk:12,jkl:27,john:2,join:[14,28,48,51,52],jone:[59,81],joy:13,juli:23,julian:23,jump:75,just:[2,5,6,8,12,19,29,31,41,47,58,59,60,69,75,87,99],kana:63,katakana:[9,63,94],keep:58,kei:[0,2,3,5,64],keyboard:[5,38],keyword:[6,13,20,21,22,23],kile:85,kind:9,know:[4,5,39],knowledg:5,known:[0,2,3,5,31,45,56,66,98],knuth:[2,11,101],koi8:30,korean:[9,30],l10n:13,lacinia:[84,85,101],lai:69,languag:[0,2,3,5,6,7,8,11,13,17,29,31,55,57,64,65,92,94,99,101],language_countri:[6,55,57],language_country_vari:[6,57],lappli:90,larg:9,larger:[2,5],largest:12,last:[2,7,12,29,46,58,59,60,75,82,83,86,93,97,101],latest:1,latex:[0,3],latin1:[2,5,38,44],latin:[9,68,69,71,94,101],lazi:75,lc_ctype:[5,38,39],ldflag:[1,2],lead:[4,5,9,12,17],leak:2,leap:[25,90],least:[4,12,2
7,30,31,68,71,84],leav:[86,87],led:2,ledkov:2,left:[0,3,9,46,58,64,66,75,101],legal:9,legibl:30,length:[0,2,3,4,9,11,12,29,30,31,38,46,47,48,51,52,53,54,58,59,62,67,68,69,71,75,78,79,80,81,86,87,96,100,101],lenient:[21,23],less:[12,17,54,58],let:5,letter:[6,8,9,10,11,14,18,23,24,30,34,36,48,50,51,53,62,63,64,66,70,71,78,90,92,94,100],level:[2,64],lexicograph:[17,67,78],lib64:1,lib:[1,2,49],libc:2,libicu:[1,2],librari:[1,2,17,31,49,97],licens:[0,2,13],ligatur:17,like:[0,1,2,4,5,9,13,14,19,23,31,47,51,58,59,68,75,81,87,92,99,101],limit:[30,66],line:[0,1,2,3,8,9,12,13,19,30,59,63,66,68,73,81,84,85,101],line_break:[8,19,47,59,63,81],linesnempti:84,linguist:[8,9],link:[1,2,9,13],linker:1,linux:[2,5],lipca:23,list:[0,1,2,3,4,5,6,8,9,12,13,16,17,18,19,27,29,30,31,32,33,34,35,36,39,42,44,46,47,49,55,58,59,60,67,75,78,79,80,81,82,83,87,88,89,92,94,99,100,101],liter:[12,23,66,75],littl:1,lll:23,llll:23,lllll:23,load:[2,5,30,84,85],local:[0,2,3,7,8,9,12,13,15,17,19,20,21,22,23,26,29,46,47,49,58,59,63,64,67,78,79,81,89,90,92,99,101],locale_manag:[6,55,56,57],locale_sensit:[6,8,10,15,17,19,29,31,47,59,64,67,78,79,81,92,99,101],localiz:[0,2,3],locat:[0,2,3,7,8,10,11,19,23,44,47,81],locate_first:58,locate_last:58,log:[67,78],logic:[4,15,17,21,23,27,29,30,34,35,36,37,43,44,46,47,48,49,50,51,54,58,59,60,63,64,65,66,67,68,69,75,78,80,81,82,83,86,87,88,96,101],london:89,longer:[2,36,72,93],longest:[51,54],look:[2,12,14,15,17,30,80,83],lookahead:58,lookup:12,loos:12,lorem:[0,2,3,18,52,75,80,84,85,86,101],los_angel:23,lower:[13,64,92,94],lowercas:[9,94],lukaszdaniel:2,lunar:23,lunch:60,machin:[1,5,39],macro:2,made:2,magrittr:[2,86,87],mai:[1,2,4,5,6,7,8,9,11,12,17,19,20,21,22,23,24,30,33,35,38,39,40,42,43,44,53,54,55,56,57,58,59,62,63,66,68,70,71,75,76,77,80,81,83,84,85,86,92,95,96,97,101],main:30,mainli:94,major:5,make:[1,2,5,8,83,96],makeconf:1,makevar:2,malform:[2,9,55],malici:2,man:[4,7,9,13,45],manag:[1,2,13],mandatori:63,mani:[0,2,6,7,9,12,13,55,57,91,96,97,101],manipul:[5,13],man
ual:[0,1,2,4,5,12,13,24],map:[0,2,3,5,6,13,40,43,55,65],marek:[0,13],margin:8,mario:17,mark:[2,5,8,9,12,27,30,32,34,35,36,38,40,41,43,44,62,72,86,96],marker:[23,44,72],markov:69,markup:30,mask:98,master:[1,12],match:[0,2,3,6,7,8,9,10,12,13,30,31,38,39,46,47,58,59,65,66,75,82,97],matcher:[0,3,4],math:9,mathemat:[9,94],matric:[2,58,59,60,86,87],matrix:[0,3,46,47,58,59,60,80,81,86],max:33,max_count:[2,27],maxim:[33,44,66,72,80,81,101],maximum:1,mean:[9,23,35,36,57,66,84,90,91],meaning:5,mechan:[5,38],medial:100,medium:23,memcheck:2,memori:[2,5,62,73],mention:[19,59,64,81],mere:46,merg:[2,30,46,58,75],messag:[2,12],met:1,meta:83,metacharact:66,method:[53,91,101],mgk25:100,microsystem:2,middl:[8,9,86],might:[9,11,17,19,23,27,30,37,44,86,90],migrat:[9,65],mileston:2,millisecond:[20,22,23,66],mime:33,mimic:2,min:33,mind:[5,58],minim:[2,33,54,68,101],minu:5,minut:[20,21,22,23],mirror:[1,2],misalign:2,mislead:[5,53],miss:[0,2,3,27,29,38,40,42,43,44,46,47,48,50,51,53,58,59,60,61,62,64,66,67,74,78,80,84,86,87,88],mmm:23,mmmm:23,mmmmm:23,mode:[46,58,60,66,72,73,75,101,102],model:[69,96],modifi:[6,9,20,23,57,85,88],mondai:23,mono:100,monster:92,month:[20,21,22,23,26],more:[0,1,2,4,5,6,8,9,10,12,13,17,18,19,23,24,27,30,31,33,37,43,44,46,47,48,56,57,58,59,60,64,67,72,75,78,79,80,81,83,88,89,91,92,96,97,101],moreov:[0,1,2,5,9,19,24,27,38,51,53,54,58,75,82,98,101],morri:[2,11],most:[0,1,2,4,5,9,23,24,26,30,35,36,64,66,96,97,101],mostli:30,move:[2,64],much:[2,10,17,29,72,94,99],multi:[5,9,30],multi_lin:66,multilin:66,multipl:[0,2,3,23,68,86,101],multitud:0,must:[6,8,12,75,87],mutual:[86,87],n_max:2,n_min:[2,54,80,81],n_paragraph:[2,69],na_character_:[2,32,54,60,90],na_empti:[2,48,74],na_integer_:90,na_last:[2,67,78],name:[1,2,4,5,9,12,17,18,19,20,21,22,23,26,27,29,30,31,33,37,39,44,46,47,55,57,58,59,60,63,64,65,66,67,72,73,75,78,79,80,81,83,84,85,88,89,90,92,94,99,102],narrow:26,nativ:[0,2,3,5,9,13,38,39,43,44,49,62,96],natur:[2,5,7,11,13,17,29,64,99,101],nchar:[2,100],necessari:[1,4
,15,18,27,46,58,60,71,75,80,83,88],necessarili:6,need:[2,4,5,12,30,62,86,87,90,97],neg:[12,27,29,80,81,83,86,101],negat:[2,9,27,83,88],neither:[39,43],nel:82,network:96,never:[80,82],new_substr:86,newer:1,newlin:[12,72,82,102],next:82,nfc:[86,96,100],nfd:[64,94,96],nfkc:96,nfkc_casefold:96,nfkd:[94,96],nibh:[84,85,101],nice:2,nie:94,nil:2,nisan:21,nix:2,non:[2,4,5,9,10,12,17,19,20,21,22,23,27,29,45,47,59,64,67,70,71,77,78,81,84,86,98,99,101],noncharacter_code_point:9,nondecreas:[67,78],none:[2,84,101],nonincreas:[67,78],nor:[39,43],norm:96,normal:[0,2,3,5,9,13,17,37,53,62,64,69,70,71,77,86,94,97,99,100,101],normalis:[0,2,64,101],northern:90,norwegian:30,note:[1,2,5,8,9,10,11,12,13,14,17,18,19,20,22,23,30,32,35,36,39,40,41,43,44,46,47,51,53,56,57,58,59,60,63,66,68,75,77,80,81,83,86,90,92,94,96,97,98,100,101],noteworthi:102,noth:[23,102],notion:[10,17,100],now:[1,2],nparagraph:[2,69],npattern:75,nth:12,nul:[44,62],number100:64,number2:64,number:[0,1,2,3,5,6,7,9,12,13,20,22,23,25,27,28,31,33,46,54,63,68,69,71,75,80,81,84,85,92,93,100,101],numer:[2,4,5,9,21,23,30,31,64,67,78,90,101],numeric_valu:9,object:[0,2,3,14,15,17,19,20,22,23,25,32,38,42,46,47,50,51,53,59,62,63,64,65,66,72,73,76,80,81,86,88,100,102],observ:[2,5,6,43,71,90],obtain:[0,2,5,9,30,31,55,84,85,90],occur:[7,8,12,30,44],occurr:[0,2,3,7,18,27,31,44],octal:[12,98],off:1,offset:[89,90],often:[0,10,30,35,62,69,94,96,97],ogonek:[5,36,77,96],old:39,older:1,oldloc:57,oldrel:2,oldtz:91,omit:[1,48,63,82],omit_empti:[2,48,80,82],omit_na:[2,86,87,88],omit_no_match:[2,46,47,52,58,59,60,87],onc:[4,27,73],one:[1,2,4,5,6,8,9,12,18,20,23,26,27,32,33,38,42,44,46,48,53,54,55,58,59,60,62,63,64,68,71,75,84,87,88,89,90,92,94,96,102],ones:[33,64,98],onli:[2,4,5,9,12,30,33,38,39,46,48,51,52,58,59,60,63,66,68,75,79,80,81,82,86,87,88,90,92,97,101],ooo:[12,98],oooo:23,open:[0,2,9,72,73,102],opensus:[1,2],oper:[0,1,2,3,4,5,7,8,9,13,14,15,17,21,29,30,32,42,57,62,66,68,70,71,77,86,87,91,94,99,101],operator_add:[0,3],operator_compar:[0
,3],operator_dollar:[0,3],opposit:64,optim:5,option:[1,2,6,15,17,29,30,43,51,52,67,78,79,99],opts_brkit:[2,19,47,59,81,92],opts_col:[2,17,18,27,29,46,58,64,67,75,78,79,80,83,88,99],opts_fix:[2,18,27,46,58,65,75,80,83,88],opts_regex:[2,18,27,46,58,60,66,75,80,88],oracl:2,order:[0,2,3,5,6,9,13,17,27,30,31,43,44,64,70,72,77,78,79,86,96],ordinari:[51,64],org:[1,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,90,91,92,94,95,96,97,99,100],orient:85,origin:[2,79,85],other:[0,2,4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],otherwis:[4,23,27,29,44,45,46,47,49,51,52,54,66,71,80,81,84,89,90,101],our:[1,2,4,5,97],out:[1,2,5,9,46,50,68,69,86,97],output:[2,5,23,42,43,44,47,53,67,68,70,71,72,73,77,78,88,96,102],outsid:[12,23],over:[2,5,14,15,16,17,18,19,20,21,22,23,27,28,30,31,46,47,51,58,59,60,68,71,75,80,81,82,83,86,87,88,92,93,97,101],overal:12,overflow:2,overful:2,overlap:[2,9,46,58,60,65,75],overload:16,overrid:1,overwhelm:1,own:44,pace:13,pacif:23,packag:[1,2,5,9,47,57,68,91],pad:[0,2,3,13],page:[2,4,5,7,13,24,45],pair:9,pairwis:15,paper:[0,2,10],paragraph:[0,2,3,8,9,69,82],paramet:[2,10,82,86,87],parametr:6,parenthes:[12,60,75],pars:[0,2,3,13],part:[1,2,9,38,39,75,86,87],particular:[1,4,5,6,8,9,13,63,86,94],pass:[0,1,2,3,16,18,27,46,55,58,59,60,63,64,65,66,75,80,83,86,87,88],password:71,past:[2,48,51,76],pat1:9,pat2:9,pat:[58,83],patch:2,path:1,patter:2,pattern:[0,2,3,4,7,10,12,13,23,30,66,71,93,97],pdf:2,pdt:23,peculiar:[4,70,71,77],pellentesqu:[84,101],per:[4,6,57,69,101],perform:[0,2,3,4,5,6,7,9,10,11,12,15,17,19,29,47,56,57,59,62,63,64,66,67,73,78,81,94],perhap:[67,78],perl:[9,12],permiss:64,permut:[0,2,3,70,77],persian:26,phonebook:[6,17],php:85,piec:[9,10,19,80,81],pipabl:2,pipe:[2,86,87],pizza:60,pkg:[1,2],pkg_config:
[1,2],pkg_config_path:1,pl_fonipa:94,pl_pl:[17,23,26,55,67,78,79],place:[9,86,87,88],plai:[5,87],plain:76,plass:101,platform:[1,2,5,6,13,38,82,91,102],pleas:[1,4,5,9,10,17,24,44,60,63,97],plu:[5,9,12],point:[0,2,3,5,8,9,12,13,15,17,19,31,32,33,40,42,44,59,62,64,65,68,71,77,83,84,86,90,92,93,99,101],polish:[5,6,17,30],poor:2,poorli:66,portabl:[0,1,2,5,9,44],portion:12,portugues:30,posit:[2,5,8,9,12,35,36,58,59,63,64,80,81,83,86,101],posix:[2,65],posix_alnum:9,posix_blank:9,posix_graph:9,posix_print:9,posix_xdigit:9,posixct:[20,21,22,23,25],posixst:23,possess:12,possibl:[0,1,2,3,4,5,12,31,38,63,65,80,81,83,96,101],potenti:96,power:[0,12,13],pqrst:28,practic:101,pratt:[2,11],pre:[2,94],preced:[9,12],precis:[5,6,66,90],predefin:[9,69],predict:13,prefer:12,prefix:[2,101],prepar:2,preprocessor:1,preserv:[2,97,101],prevent:[2,63],previou:[12,57,91],previous:[2,39,57,91],primari:64,print:[2,5,8,9,20,53,68,86,87,88,100,101],printabl:45,prioriti:86,privat:9,probabl:71,problem:[1,2,96],problemat:44,proce:100,process:[2,3,5,7,8,9,10,11,17,29,30,45,47,62,66,68,69,80,91,94,96,97,99,101],produc:[23,44,65],prof:[59,81],program:[5,6,101],proin:[85,101],project:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94,95,96,97,99],pronounc:0,propag:1,proper:36,properli:[1,5,6,10,38,50,53,62],properti:[4,7,12,18,84,97,100],protect:2,protocol:5,provid:[2,5,6,9,10,11,12,13,16,17,31,33,47,49,51,55,60,64,86,89,90,93,94,101],pseudo:[2,13,69,70,71],pt_br:57,punct:9,punctuat:[8,9,10,11,23],purpos:[2,5,8,82],put:[67,78,96,101],python:16,qqq:23,qqqq:23,qqqqq:23,quarter:[23,26],quaternari:64,queri:[0,3,6,56,91],quick:75,quicker:75,quit:[0,5,12,66],quot:[9,12,23,45],quotat:9,quotation_mark:9,r_home:1,r_inst_dir:1,r_usedynamicsymbol:2,ragged:[2,101],rais:[2,33],random:[0,2,3,9,13,69,70,77],randomli:[0,3,69],rang:[0,5,9,12,23,86,87,94],ranki:94,rare:[2,4,5],rather:[27,44,66,68,83,88,96,101],raw:[0,3,5,30,31,34,35,36,42,44,89,90],rawoffset:89,rawtochar:[30,44],rbbi:63,rbind:90,rbuild
ignor:1,rchk:2,rcpp:[0,2],read:[0,2,3,5,13,38,41],readabl:89,readbin:30,readlin:[30,72,84,85],real:23,realli:[5,55],rearrang:67,reason:[2,4,5,43,44],recal:9,recent:1,recogn:[6,45,66,98],recommend:[96,101],recycl:[2,4,15,18,27,46,58,60,71,75,80,83,87,88],redund:71,refer:[0,1,2,18,24,27,46,58,60,75,80,83,88],referenc:6,reflect:[6,33],reformat:101,regard:29,regardless:5,regex:[0,2,3,4,7,9,18,27,46,58,75,80,83,88],regexmatch:2,regexp:[9,12,66],region:[6,90],regular:[0,3,4,5,7,9,13,66,82,97],reilli:12,rel:[1,23],relat:[13,15,17,23],relationship:64,releas:[0,1,2,84,85],relev:1,reli:[1,2,5,83,97],reliabl:64,remaind:[80,81],rememb:4,remov:[0,2,3,5,9,17,30,37,43,63,64,65,66,67,75,78,80,82,94,96,97,99],renam:2,rep:70,replac:[0,2,3,7,13,20,23,24,40,43,44,71,80,88,93,97,101],repo:1,report:[1,2,9,12,19,66,82,96,100],repres:[5,9,17,23,25,30,32,33,36,37,46,58,60,66,82,84,85,90],represent:[2,5,21,33,79,89,91],request:[5,6,24,56],requir:[1,2,11,12,23,63],reserv:[9,23],resolv:1,resourc:[6,56],respect:[2,4,9,12,18,23,27,46,47,58,59,75,80,81,83,86,87,88,93],rest:92,restor:[57,91],restrict:94,result:[2,4,5,6,9,11,12,13,14,15,17,18,19,23,27,28,29,35,36,37,41,43,46,47,49,51,52,54,55,58,60,64,65,69,70,71,75,77,78,79,80,81,82,83,87,88,92,98],retri:12,reus:4,revers:[0,3,13,33,68,70],revert:2,rexamin:75,rf_error:2,rfc3629:13,rfc5198:96,rfc:[13,23,96],rid:[2,74],right:[0,3,9,46,58,75],robust:72,role:[5,87],romanian:30,roughli:[31,42,76,88,100],round:[2,60,75],routin:[2,5],row:[23,46,47,54,58,59,60,80,81],rpm:1,rule:[2,4,19,47,59,63,64,82,87,90,96],run:[2,30,46,57,62,75,83,86,91],russian:30,sake:23,same:[2,5,6,9,13,17,29,33,38,39,50,53,54,55,57,62,64,79,80,90,96,99,100],sampl:[71,78],saniti:2,sappli:[69,89],sausag:52,save:[89,90],scelerisqu:[84,85,101],scenario:[46,58,60,87],scharf:92,schedul:2,scheme:[5,9,33],scp:1,screen:68,script:[1,2,9,68,71,94,101],search:[0,1,2,3,4,5,6,9,11,12,13,18,19,27,29,46,47,58,59,60,63,64,66,71,75,80,81,83,84,88,97,100],search_charclass:[7,9,97],search_col:[7,10,64
],search_count:[7,18,19],search_detect:[7,27,83],search_extract:[7,46,47,60],search_fix:[7,11,65],search_loc:[7,58,59],search_regex:[7,12,66],search_replac:[7,75,97],search_split:[7,80,81,82],search_subset:[7,88],second:[2,17,20,21,22,23,25,58,59,60,90],secondari:64,section:[6,9,12,66],sed:[1,84,85,101],see:[0,1,2,16,68,77],seek:13,seem:10,seen:[2,38],segfault:2,select:[0,3,5,6,22,31,33,69,101],selector:26,semant:5,sens:5,sensit:[0,3,7,13,23,57,65,66,92],sentenc:[8,19,59,63,69,81,92],sep:[2,14,23,48,51,52,68,69,76,101,102],separ:[8,9,23,47,48,51,52,55,58,63,72,80,82,83,84,85,94,102],septemb:23,sequenc:[0,1,2,3,5,11,12,23,30,32,34,36,40,42,43,44,53,58,66,82,94,96,101],seri:[9,94],serv:[44,82],server:[1,2],servic:[2,5,6,10,56,64,90,94],session:1,set:[0,1,2,3,4,5,6,9,11,12,17,18,19,20,21,22,23,27,29,32,42,43,44,46,47,51,53,58,59,60,67,69,71,75,78,79,80,81,82,83,88,92,99],setdatadirectori:2,setup:1,sever:[6,30],shall:2,shape:9,shift_ji:30,ship:[1,2],shorter:[15,18,27,46,58,60,75,80,83,88],should:[1,2,5,6,21,23,29,30,38,39,44,48,49,54,58,63,65,67,68,69,74,75,78,80,82,88,97,100,101],show:30,shown:[5,9,12],shuffl:[0,3],side:[0,3,68,101],sign:[2,5,9,20,25],signific:[2,6,23],significantli:[29,99],silent:[2,4,5,17,43,51,52,86],similar:[2,5,6,9,12,16,43,54,55,90],simpl:[2,5,38,65,69,101],simplest:87,simpli:[1,2],simplifi:[2,30,37,46,47,69,80,81,101],simplify2arrai:54,sinc:[0,9,12,25,46,75,90],singl:[2,5,8,9,16,19,20,21,22,23,26,27,29,30,31,32,33,37,39,40,43,44,46,47,48,49,51,52,54,55,57,58,59,60,63,64,65,67,68,69,71,72,75,76,78,80,81,82,83,86,87,88,89,90,91,92,93,94,97,101],singleton:27,sit:[18,52,69,75,80,84,85,86,101],site:[1,2,13,90],situat:39,six:12,size:[33,44,66,72],sk_sk:[17,46,58,67,78,79,89],skip:[46,58,75],skip_:63,skip_line_hard:63,skip_line_soft:63,skip_sentence_sep:[63,81],skip_sentence_term:63,skip_word_ideo:63,skip_word_kana:63,skip_word_lett:[63,81],skip_word_non:[19,59,63,81],skip_word_numb:[63,81],slash:9,slightli:[83,85],slovak:17,slow:75,slower:[10,14,29,99
],small:[5,71,85,92,94],smaller:87,smith:[59,81],snprintf:2,soft:[9,63,100],soft_dot:9,softwar:101,solari:[1,2,39],sole:[2,5],solut:1,solv:2,some:[1,2,4,5,9,11,12,13,23,24,30,33,37,44,48,55,56,57,58,63,66,85,86,89,98],somehow:5,someth:[9,75],sometim:[4,35,53,82],somewhat:12,sort:[0,2,3,5,6,13,37,64,67,87],sourc:[0,1,2,69],sourceforg:85,southern:90,space:[2,5,8,9,12,18,23,46,58,66,75,84,85,97,100,101],space_separ:12,spaghetti:60,spam:[19,52,59,81],sparc:1,speak:5,special:[5,9,45,63,66],specif:[2,6,8,9,10,11,13,17,20,23,31,56,83,90,96],specifi:[2,5,6,9,12,20,21,22,23,24,37,44,63,71,75,94,96,97,101],spectrum:5,speed:[2,5,66],spell:2,split:[0,2,3,7,12,13,72,73,101],spontan:2,sprintf:[0,2,3],squar:[9,101],src:[1,2],sse2:2,sss:23,ssss:23,ssz:23,stabl:[67,78],stable_sort:[67,78],stack:[2,66],stack_limit:[2,66],stage:2,stand:[6,9,22,23,26],standalon:26,standard:[0,1,2,5,6,9,12,33,59,62,81,82,96,98,100],start:[0,2,3,7,8,9,27,46,58,59,66,68,69,75,86,87,97,101],start_lipsum:69,stat:[84,85],state:[2,9,20,68,89,101],statist:[0,3,5,13,30,31],statu:[2,19,47,59],stdin:[5,38],step:94,stick:97,still:[1,6],sting:27,stl:[67,78],stop:[2,27,66],storag:[5,66],store:[5,62],str2:76,str:[2,11,18,19,23,27,28,29,30,31,34,35,36,38,40,41,42,43,44,45,46,47,48,50,53,58,59,60,62,67,68,70,75,76,77,78,79,80,81,82,83,84,85,86,87,88,92,93,94,96,97,98,99,100,101,102],str_split_fix:2,strchr:2,strcmp:17,stream:[0,3,40,43],strength:[17,29,46,58,64,83,99],strftime:[23,24],stri:[2,14,15,16,28],stri_:[2,4,7,9,10,12,65,83],stri_brkit:2,stri_c:[2,51],stri_c_list:52,stri_cmp:[2,13,17,64],stri_cmp_eq:[2,17,92],stri_cmp_equiv:[2,15,17],stri_cmp_g:[2,17],stri_cmp_gt:[2,17],stri_cmp_l:[2,15,17],stri_cmp_lt:[2,17],stri_cmp_neq:[2,17],stri_cmp_nequiv:[2,17],stri_col:64,stri_compar:[0,3,6,8,10,15,19,29,31,47,59,64,67,78,79,81,92,99,101],stri_conv:44,stri_count:[0,2,3,7,19],stri_count_:7,stri_count_boundari:[0,2,3,6,7,8,10,13,15,17,18,29,31,47,53,59,63,64,67,78,79,81,82,92,99,101],stri_count_charclass:18,stri_count_col:
18,stri_count_fix:[2,18,65],stri_count_regex:[18,66],stri_count_word:[2,19,47,59],stri_datetime_add:[0,2,3,21,22,23,24,25,26,89,90,91],stri_datetime_cr:[0,2,3,20,22,23,24,25,26,89,90,91],stri_datetime_field:[0,2,3,20,21,23,24,25,26,89,90,91],stri_datetime_format:[0,2,3,13,20,21,22,24,25,26,89,90,91],stri_datetime_fstr:[0,2,3,20,21,22,23,25,26,89,90,91],stri_datetime_now:[0,2,3,20,21,22,23,24,26,89,90,91],stri_datetime_pars:[2,23,24],stri_datetime_symbol:[0,2,3,20,21,22,23,24,25,89,90,91],stri_detect:[0,2,3,7,83,88],stri_detect_:[2,7],stri_detect_charclass:27,stri_detect_col:[27,64],stri_detect_fix:[27,65],stri_detect_regex:[2,27,66,83],stri_dup:[0,2,3,13,14,48,51,52],stri_dupl:[0,2,3,6,8,10,13,15,17,19,31,47,59,64,67,78,79,81,92,99,101],stri_duplicated_ani:[2,29],stri_enc_detect2:[0,2,3,5,6,8,10,15,17,19,29,30,34,35,36,47,59,64,67,78,79,81,92,99,101],stri_enc_detect:[0,2,3,5,31,34,35,36,73],stri_enc_fromutf32:[0,3,5,40,41,42,43,44,46,100],stri_enc_get:[5,38,39,41,43,44],stri_enc_info:[0,3,5,37,38,39,49],stri_enc_isascii:[0,2,3,5,30,31,35,36],stri_enc_isnf:2,stri_enc_isutf16:[0,3],stri_enc_isutf16b:[5,30,31,34,35,36],stri_enc_isutf16l:35,stri_enc_isutf32b:35,stri_enc_isutf32l:35,stri_enc_isutf8:[0,2,3,5,30,31,34,35],stri_enc_list:[0,3,5,33,38,39,44],stri_enc_mark:[0,2,3,5,33,37,39,40,41,43,44],stri_enc_nf:2,stri_enc_set:[0,2,3,5,33,37,38],stri_enc_toascii:[0,3,5,32,41,42,43,44],stri_enc_ton:[0,2,3,5,32,40,42,43,44],stri_enc_toutf32:[0,3,5,32,40,41,43,44],stri_enc_toutf8:[0,2,3,5,32,40,41,42,44,53,76],stri_encod:[0,2,3,5,30,32,40,41,42,43,72,73],stri_endswith:[2,27,83],stri_endswith_:[2,7],stri_endswith_charclass:83,stri_endswith_col:83,stri_endswith_fix:83,stri_escape_unicod:[0,3,13,62,98],stri_extract:[0,2,3,7,58,60],stri_extract_:[2,7,46,47],stri_extract_al:[2,7,46,47,54,60,87],stri_extract_all_:[2,46,47],stri_extract_all_boundari:[6,7,8,10,15,17,19,29,31,46,47,59,60,63,64,67,78,79,81,82,92,99,101],stri_extract_all_charclass:[2,46],stri_extract_all_col:46,stri_extr
act_all_fix:[2,46,65],stri_extract_all_regex:[2,46,52,60],stri_extract_all_word:[2,8,12,19,47,52,59],stri_extract_boundari:[0,3],stri_extract_first:[46,86],stri_extract_first_:[46,47],stri_extract_first_boundari:47,stri_extract_first_charclass:46,stri_extract_first_col:46,stri_extract_first_fix:46,stri_extract_first_regex:46,stri_extract_first_word:[2,47],stri_extract_last:[46,86],stri_extract_last_:[46,47],stri_extract_last_boundari:47,stri_extract_last_charclass:46,stri_extract_last_col:46,stri_extract_last_fix:46,stri_extract_last_regex:46,stri_extract_last_word:[2,47],stri_extract_word:2,stri_flatten:[0,2,3,13,14,28,30,51,52,69],stri_info:[0,2,3,39],stri_install_check:2,stri_install_icudt:2,stri_isempti:[0,3,53,62,100],stri_join:[0,2,3,4,13,14,28,48,52],stri_join_list:[0,2,3,14,28,48,51],stri_length:[0,2,3,13,19,50,62,93,100],stri_list2matrix:[0,2,3,46,47,61,74,76,80,81],stri_loc:[0,2,3,7],stri_locale_get:57,stri_locale_info:[0,3,6,49,56,57],stri_locale_list:[0,3,6,55,57],stri_locale_set:[0,3,6,55,56],stri_locate_:[7,58,59],stri_locate_al:[7,58,59,86,87],stri_locate_all_:[2,58,59],stri_locate_all_boundari:[2,6,7,8,10,15,17,19,29,31,47,58,59,63,64,67,78,79,81,82,86,87,92,99,101],stri_locate_all_charclass:[2,58],stri_locate_all_col:58,stri_locate_all_fix:[2,58,65],stri_locate_all_regex:[44,58,87],stri_locate_all_word:[2,19,59],stri_locate_boundari:[0,2,3],stri_locate_first:[58,86,87],stri_locate_first_:[58,59],stri_locate_first_boundari:[2,59],stri_locate_first_charclass:58,stri_locate_first_col:58,stri_locate_first_fix:58,stri_locate_first_regex:[58,86],stri_locate_first_word:[2,59],stri_locate_last:[58,86,87],stri_locate_last_:[58,59],stri_locate_last_boundari:[2,59],stri_locate_last_charclass:58,stri_locate_last_col:58,stri_locate_last_fix:58,stri_locate_last_regex:[58,86],stri_locate_last_word:[2,59],stri_locate_regex:2,stri_locate_word:2,stri_match:[0,2,3,7,12,46],stri_match_:[2,60],stri_match_al:[7,46,47,60],stri_match_all_:[2,60],stri_match_all_regex:60,str
i_match_first:60,stri_match_first_regex:60,stri_match_last:60,stri_match_last_regex:60,stri_na2empti:[0,2,3,54,74,76],stri_numbyt:[0,3,19,50,53,100],stri_omit_empti:[2,74],stri_omit_empty_na:[2,74],stri_omit_na:[2,74],stri_opts_brkit:[0,2,3,7,8,19,47,59,81,82,92,101],stri_opts_col:[0,2,3,6,7,8,10,13,15,17,18,19,27,29,31,46,47,58,59,67,75,78,79,80,81,83,88,92,99,101],stri_opts_fix:[0,2,3,7,11,18,27,46,58,75,80,83,88],stri_opts_regex:[0,2,3,7,12,18,27,46,58,60,75,80,88],stri_ord:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,78,79,81,92,99,101],stri_pad:[0,2,3,13,101],stri_pad_:[2,68],stri_pad_both:[2,68],stri_pad_left:[2,68],stri_pad_right:[2,68],stri_past:[2,51,58,70,71,76,83,101],stri_paste_list:52,stri_prepare_arg_posixct:2,stri_rand_lipsum:[0,2,3,13,70,71],stri_rand_shuffl:[0,2,3,13,69,71,77],stri_rand_str:[0,2,3,9,13,69,70],stri_read_bin:2,stri_read_lin:[0,2,3,13,73,84,102],stri_read_raw:[0,2,3,13,72,102],stri_remove_empti:[0,2,3,54,61,76],stri_remove_empty_na:[2,74],stri_remove_na:[2,74],stri_replac:[0,3,7,97],stri_replace_:[7,75],stri_replace_al:[2,7,75,97],stri_replace_all_:[2,75],stri_replace_all_charclass:[2,75],stri_replace_all_col:75,stri_replace_all_fix:[2,75],stri_replace_all_regex:75,stri_replace_first:[75,86],stri_replace_first_charclass:75,stri_replace_first_col:75,stri_replace_first_fix:75,stri_replace_first_regex:75,stri_replace_last:[75,86],stri_replace_last_charclass:75,stri_replace_last_col:75,stri_replace_last_fix:75,stri_replace_last_regex:75,stri_replace_na:[0,2,3,54,61,74],stri_revers:[0,3,13,70],stri_sort:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,79,81,92,99,101],stri_sort_kei:[0,2,3,6,8,10,15,17,19,29,31,47,59,64,67,78,81,92,99,101],stri_split:[0,2,3,7,54,81,82],stri_split_:[2,7],stri_split_boundari:[0,2,3,6,7,8,10,15,17,19,29,31,47,59,63,64,67,78,79,80,82,92,99,101],stri_split_charclass:[2,80],stri_split_col:[2,80],stri_split_fix:[2,55,80],stri_split_lin:[0,3,7,8,13,19,47,59,63,80,81,92,101],stri_split_lines1:[72,73,82],stri_split_regex:[2,80
],stri_startsendswith:[0,3],stri_startswith:[2,7,27,83],stri_startswith_:[2,7],stri_startswith_charclass:83,stri_startswith_col:83,stri_startswith_fix:83,stri_stats_gener:[0,3,13,85],stri_stats_latex:[0,3,13,84],stri_sub:[0,2,3,13,58,59,87],stri_sub_al:[0,2,3,58,59,86],stri_sub_all_replac:87,stri_sub_replac:[2,86],stri_sub_replace_al:[2,87],stri_subset:[0,2,3,7,27],stri_subset_:[2,7],stri_subset_charclass:88,stri_subset_col:88,stri_subset_fix:88,stri_subset_regex:88,stri_timezone_get:[2,20,21,22,23,24,25,26,89,90,91],stri_timezone_info:[0,2,3,20,21,22,23,24,25,26,90,91],stri_timezone_list:[0,2,3,20,21,22,23,24,25,26,89,91],stri_timezone_set:[0,2,3],stri_trans_casefold:2,stri_trans_casemap:[0,3],stri_trans_char:[0,2,3,13,92,94,95,96],stri_trans_gener:[0,2,3,13,92,93,95,96],stri_trans_isnf:[2,96],stri_trans_isnfc:96,stri_trans_isnfd:96,stri_trans_isnfkc:96,stri_trans_isnfkc_casefold:96,stri_trans_isnfkd:96,stri_trans_list:[0,2,3,92,93,94,96],stri_trans_nf:[0,2,3],stri_trans_nfc:[5,13,53,86,92,93,94,95,96,100,101],stri_trans_nfd:[77,94,96],stri_trans_nfkc:96,stri_trans_nfkc_casefold:96,stri_trans_nfkd:[17,19,29,53,68,96,99,100],stri_trans_to:2,stri_trans_tolow:[6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,78,79,81,82,92,93,94,95,96,99,101],stri_trans_totitl:[2,8,92],stri_trans_toupp:[92,94],stri_trim:[0,3,7,13,75],stri_trim_both:[7,9,75,97],stri_trim_left:[68,97],stri_trim_right:97,stri_unescape_unicod:[0,3,45],stri_uniqu:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,78,79,81,92,101],stri_width:[0,2,3,13,50,53,62,68,101],stri_wrap:[0,2,3,6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,68,69,78,79,81,82,92,99],stri_write_lin:[0,2,3,13,72,73],stricontainerutf16:2,stricontainerutf8:2,strictest:64,striexcept:2,string8:2,string:[2,3,4,5,6,9,11,12,16,18,19,20,21,22,23,26,27,29,30,31,32,33,34,35,36,39,40,45,46,47,49,51,53,54,55,57,58,59,60,62,63,64,65,66,67,69,72,75,76,78,79,84,85,86,87,88,89,90,91,93,94,96,99,100,101],stringi:[7,13,17,18,19,25,27,32,34,35,36,37,38,44,46,47,51,55,56,58,
59,60,63,64,65,66,67,68,71,75,78,79,80,81,82,83,84,85,86,88,92,94,96,97,99,100,101],stringi_1:1,stringi_cflag:[1,2],stringi_cppflag:[1,2],stringi_cxxflag:[1,2],stringi_disable_cxx11:[1,2],stringi_disable_icu_bundl:[1,2],stringi_disable_pkg_config:[1,2],stringi_general_top:[4,5,6,7,8,9,10,11,12,13],stringi_ldflag:[1,2],stringi_lib:[1,2],stringr:[0,2],stringsearch:[7,10],strncpy:2,strongli:[1,9],strptime:[0,2,3],strrringi:[18,27],strstr:2,strsxp:2,strwrap:[2,101],stubdata:2,student:2,studio:2,stuff:[84,85],style:[0,3,9,23,30],sub:[12,60,88],sub_index:2,submiss:2,subsequ:101,subset:[1,2,4,5,7,9,27,33],substitut:[2,5,40,44,72,80,86,87,88,101,102],substr:[0,2,3,12,13,46,59,60,64,75,80],success:1,successfulli:1,suffici:2,suggest:[0,1,2,6,101,102],suit:[29,97,99],suitabl:[1,2,101],summar:[9,12],sun:2,sundai:22,superset:[5,39],supplementari:[18,27,46,58,60,75,80,83,88],suppli:[2,12,30,31,75],support:[0,2,5,6,9,23,24,37,39,44,46,49,60,62,80,89,96],suppos:2,suppress:2,sure:[1,35],surrog:9,surround:92,suscipit:[84,85,101],swedish:30,sxpinfo:2,syllabl:9,symbol:[2,9,23],synonym:28,syntax:[9,12,16,23,63],sys:2,system:[1,2,5,6,8,9,38,39,49],tab:[9,12,82,101],tabl:30,tabul:12,take:[10,17,65,68,89,101],taken:[8,30],tar:1,target:[2,44],tartanu:[0,13],task:[2,7,12,13,94,95],tato:94,team:85,technic:[5,8,12,44,82,96],techniqu:30,technolog:2,tellu:[84,101],temporari:14,term:[51,90],termin:[12,27,63,66],terminal_punctu:9,tertiari:64,test1:76,test2:19,test:[2,6,9,15,17,19,27,29,30,39,59,76,81,83,99],text:[0,2,3,5,7,9,12,13,23,30,31,63,68,69,80,84,85,86,92,96,100],text_boundari:[7,8,19,47,59,63,81,82,92,101],textbf:85,textit:85,textual:9,tf08:5,tgca:93,th_th_tradit:26,than:[2,4,5,8,9,10,12,14,17,23,29,38,40,44,51,52,54,58,62,64,70,71,87,99,101],thank:[0,2],thei:[2,5,6,9,12,13,15,17,23,32,43,44,46,58,59,60,63,65,67,75,78,83,88,94],them:[5,6,17,30,33,95],themselv:[66,80],theoret:9,therefor:[5,9,17,82],therein:13,thereof:44,thi:[0,1,2,4,5,6,7,8,9,17,18,19,22,23,27,30,31,32,33,34,36,37,38,40,41
,42,43,44,46,50,51,53,54,55,58,59,60,61,62,63,64,65,66,67,68,70,71,72,75,76,77,78,79,81,82,83,84,85,90,94,96,99,101,102],think:8,third:[8,60,64],those:[5,6,10],though:[2,12],thought:5,three:[12,23,30,31,90,92],through:9,throughout:90,thu:[4,5,59,80,96,102],tie:9,time:[0,2,3,5,9,11,12,13,14,24,28,29,66,80,88,93],time_limit:[2,66],timezon:[20,23,89,90,91],titl:[13,92,94],to_raw:44,todo:2,togeth:[0,1,3,6,49,94],token:[80,81],tokens_onli:[2,80,81],toler:1,too:2,took:4,tool:[2,12,13,96],top:64,topic:[12,13],total:[12,31,68,84,97,101],tr11:100,tr13:82,tr15:96,tr18:[12,82],tr29:66,tr44:9,tr_tr:92,tracker:0,tradit:[30,66],trail:62,transform:[0,2,3,13,93,96],transit:12,translat:[0,3,5,13,33],transliter:[0,2,3,13],transpos:54,transposit:54,treat:[12,13,23,48,51,64,66,74],treatment:[67,78],tri:[2,5,8,12,31,37,39],trick:1,trim:[0,3,13,83],trivial:2,truncat:[23,69],tue:23,tuesdai:23,tune:[6,10,11,12,17,18,27,46,58,63,64,65,66,67,75,78,79,80,83,88],turkish:30,turn:64,tutori:12,tweak:[1,2,11],two:[0,2,3,5,6,9,12,15,17,23,53,58,59,82,86,87,90,92,93,96],txt:[9,30,96],type:[1,2,5,8,9,19,44,53,59,63,73,80,81,86,87,92,102],typic:[5,14,15,83,90,96],tzone:22,u0000:9,u0007:12,u0009:12,u000a:12,u000c:12,u000d:12,u0010ffff:[9,12],u001a:44,u001b:12,u0032:98,u00a0abov:[19,59,81],u00a9:19,u00df:[19,29,92,94,99],u00e1rio:17,u00e4rtn:17,u00fd:[17,46,58],u0104123:77,u0104:[34,36,50,53,62,92,94],u0105:[9,17,29,34,36,45,50,53,62,77,92,96,98,99,100],u0119:19,u0153:19,u0222:36,u03c0:19,u0627:[58,83],u0633:[58,83],u0635:[58,83],u0639:[58,83],u0644:[58,83],u0645xyz:[58,83],u0647:[58,83],u0648:[58,83],u0649:[58,83],u064a:[58,83],u105:17,u1234:36,u200c:12,u200d:12,u2190:19,u2192:19,u2193:19,u2620:94,u7fffffff:62,u_charset_is_utf8:[2,39,49],u_ea_fullwidth:100,u_ea_wid:100,u_hst_trailing_jamo:100,u_hst_vowel_jamo:100,u_init:2,u_missing_resource_error:2,u_toupp:65,uax:100,ubbfc:68,ubc1f:100,ubrk:63,ubrk_8h:63,ubrk_word_non:[19,47,59],ubsan:2,ubuntu:[1,2],uc74c:68,uc815:68,ucd:13,uchar32:33,uchar:33,uchar_ea
st_asian_width:100,uchar_hangul_syllable_typ:100,ucs:100,ud6c8:68,ufb00:17,ufdfa:[58,83,96],ufdfaxyz:[58,83],ufffd:[43,44],uhhhh:12,uhhhhhhhh:12,uint32_t:2,umlaut:36,unambigu:82,unassign:9,unavail:[33,56,60],unbound:12,unchang:[43,75,86,87],under:[0,2,5,13],underli:[18,27,46,58,60,75,80,83,88],underscor:55,understand:[5,55,98],undesir:39,unfortun:5,unicod:[0,2,3,5,7,8,11,12,13,17,19,26,32,33,42,43,49,53,62,63,64,66,68,70,71,72,77,80,82,84,86,90,91,92,93,94,97,98,99,100,101],unicode_equival:96,unicodeset:[2,94],unicodestr:2,unidata:9,uninspect:27,union:9,uniqu:[0,2,3,6,8,29,37,93],unit:[2,5,8,9,20,92],unitialis:2,univers:[2,5,13,90,97],unix:[2,5,9,66],unix_lin:66,unknown:[2,5,6,30,33,38],unless:[5,9,27,39,51,52,91],unlik:[23,29,38,42,58,99],unnecessari:97,unprotect:2,unrecogn:66,unsupport:55,until:12,unzip:1,updat:2,upgrad:2,upon:1,upper:[9,13,64,92,94],uppercas:[9,94],uppercase_first:64,ups:[2,5],uregex_8h:66,uregexpflag:66,usag:[1,2,9],use:[1,2,4,9,10,12,38,42,43,44,48,62,66,80,83,85,88,90,94,96,100],use_length:[68,101],use_width:2,usearch:2,used:[1,2,4,5,6,9,13,17,18,19,23,24,27,30,32,33,38,39,40,43,44,45,46,47,48,49,51,52,53,55,57,58,59,60,62,63,64,65,68,69,72,75,76,80,82,83,86,88,89,90,91,92,93,95,97,101],usedynlib:2,useful:[2,5,7,9,19,54,59,79,81,94],user:[1,2,5,6,8,9,10,12,17,20,23,26,29,30,39,44,63,64,65,66,67,78,79,90,92,94,95,96,99],userguid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,78,79,90,92,94,95,96,99],uses:[2,6,8,9,26,30,31,38,65,66,67,78,89,96],usesdaylighttim:89,using:[2,5,6,9,10,15,23,24,30,31,66,79,91,96,102],uslax:23,usr:1,usual:[11,15,32,45,51,53,67,78,87,88,96,99],utc:[25,90],utf8:[5,37,49],utf8toint:42,utf:[0,2,3,13,17,30,31,33,38,39,40,41,44,49,51,53,62,72,88,96,98,102],utf_8:5,utf_bom:5,util:[6,12,54,61,74,76,91,101],utr22:33,utr:82,uuuu:23,uword:66,uxxxx:[45,98],uxxxxxxxx:[45,98],valgrind:2,valid:[2,5,6,17,31,34,35,36,37,43,98],valu:[0,2,3,5,6,9,12],vari:90,variabl:[1,2,23,64],variant:[6,55,75,86,87],varieti:94,variou:[5,68,101],ve
c:32,vector:[0,2,3,5,7,13,15,16,17,18,19,20,21,22,23,24,27,28,29,30,31,32,34,35,36,37,38,40,41,42,43,44,45,46,47,48,50,52,53,54,56,58,59,60,61,62,67,68,69,70,71,72,73,75,77,78,79,80,81,82,83,87,88,90,92,93,94,95,96,97,98,99,100,101,102],vectorise_al:75,vectorize_al:[2,75],vel:[84,101],veri:[0,1,2,5,9,11,12,19,39,59,69,81,101],verifi:6,versa:23,version:[1,2,20,32,44,49,74,78,86,87,88,98,99],vertic:82,via:[1,2,11,12,30,38,51,65],vice:23,video:0,vietnames:9,vignett:2,violat:2,vowel:100,vvv:23,vvvv:23,w3c:96,wai:[2,5,10,11,12,16,23,34,35,36,44,50,64,72,76,80,94,101,102],want:[2,6,42,43],warn:[2,4,9,12,18,24,27,32,39,40,42,44,53,63,64,65,66,83,93,98],warnfix:2,warsaw:[2,91],wcwidth:100,weakli:78,web:96,wed:23,week:[20,23],weekdai:26,weekofmonth:22,weekofyear:22,weight:64,well:[2,9,13,36,45,49,64,86,100],were:[2,5,60,94],werner:10,western:5,wget:1,what:[0,4,5,8,9,11,17,39,43],whatev:12,when:[2,4,5,6,8,12,17,23,43,53,64,66,68,79,82,89,90,101],whenev:[4,5,65],where:[2,5,17,23,24,32,39,42,43,51,58,63,67,75,78,82,83,84,85,88,90,97,101],wherea:23,wherev:[76,86,87],whether:[2,6,17,23,27,29,31,34,35,36,38,44,46,49,50,58,64,66,80,82,83,86,87,88,89,96,99],which:[1,2,5,6,8,9,10,13,19,29,30,40,44,51,62,64,67,68,72,78,79,80,81,90,96,101],white:[2,9,12,13,18,46,58,66,75,84,85,97,101],white_spac:[9,18,75,80,84],whitespace_onli:[2,101],who:6,whole:[8,60,65],wickham:0,wide:[0,5,26,96],width:[0,2,3,9,13,23,26,53,68,101],wieczori:94,wiki:96,wikipedia:96,win:2,winbuild:2,window:[2,5,30,33,36,62,89,98,102],windtfmt:2,winnmfmt:2,wise:[2,7,13],wish:[1,12,48,75,80,83],within:[1,2,4,6,8,12,18,23,27,30,46,58,60,66,86,87,101],without:[0,3,6,23,66],word:[0,2,3,8,9,12,19,47,59,63,66,69,75,81,85,88,92],word_boundari:66,work:[1,2,5,30,31,41,65,86,96,98],world:[5,96],worst:11,worth:92,would:[8,62,66,97],wparenthes:2,wraca:94,wrap:[0,2,3,8,13,68,87],wrapper:[60,97],write:[0,3,8,13],writelin:102,written:[5,30,66],wspace:[83,97],www:[5,6,9,12,82,96,100],x1a:40,xaaaax:[46,58],xhh:12,xml:30,xnox:2,xxx:[23,4
8,98],xxxx:23,xxxxx:23,xyx:60,xyz:51,year:[5,20,21,22,23,89,90],yet:[2,13,96,97],yield:[2,23,46,67],you:[0,1,2,4,5,6,9,10,11,12,17,30,31,38,39,42,43,48,51,52,55,57,58,59,62,66,70,75,80,83,84,96,97,101],your:[1,4,5,6,9,38,39,62,83,97],yutannihil:2,yyyi:23,yyyyi:23,zc1:27,zero:[0,2,3,5,9,12,23,58,80,100,101],zip:[1,2],zipf:69,zone:[0,2,3,13,20,21,22,23],zwnbsp:9,zwsp:9,zxy:77,zzz:23,zzzz:23,zzzzz:23},titles:["stringi: THE String Processing Package for R","Installing stringi","What Is New in stringi","R Package stringi Reference","about_arguments: Passing Arguments to Functions in stringi","about_encoding: Character Encodings and stringi","about_locale: Locales and stringi","about_search: String Searching","about_search_boundaries: Text Boundary Analysis in stringi","about_search_charclass: Character Classes in stringi","about_search_coll: Locale-Sensitive Text Searching in stringi","about_search_fixed: Locale-Insensitive Fixed Pattern Matching in stringi","about_search_regex: Regular Expressions in stringi","about_stringi: THE String Processing Package","operator_add: Concatenate Two Character Vectors","operator_compare: Compare Strings with or without Collation","operator_dollar: C-Style Formatting with sprintf as a Binary Operator","stri_compare: Compare Strings with or without Collation","stri_count: Count the Number of Pattern Matches","stri_count_boundaries: Count the Number of Text Boundaries","stri_datetime_add: Date and Time Arithmetic","stri_datetime_create: Create a Date-Time Object","stri_datetime_fields: Get Values for Date and Time Fields","stri_datetime_format: Date and Time Formatting and Parsing","stri_datetime_fstr: Convert strptime-Style Format Strings","stri_datetime_now: Get Current Date and Time","stri_datetime_symbols: List Localizable Date-Time Formatting Data","stri_detect: Detect a Pattern Match","stri_dup: Duplicate Strings","stri_duplicated: Determine Duplicated Elements","stri_enc_detect: Detect Character Set and 
Language","stri_enc_detect2: [DEPRECATED] Detect Locale-Sensitive Character Encoding","stri_enc_fromutf32: Convert From UTF-32","stri_enc_info: Query a Character Encoding","stri_enc_isascii: Check If a Data Stream Is Possibly in ASCII","stri_enc_isutf16: Check If a Data Stream Is Possibly in UTF-16 or UTF-32","stri_enc_isutf8: Check If a Data Stream Is Possibly in UTF-8","stri_enc_list: List Known Character Encodings","stri_enc_mark: Get Declared Encodings of Each String","stri_enc_set: Set or Get Default Character Encoding in stringi","stri_enc_toascii: Convert To ASCII","stri_enc_tonative: Convert Strings To Native Encoding","stri_enc_toutf32: Convert Strings To UTF-32","stri_enc_toutf8: Convert Strings To UTF-8","stri_encode: Convert Strings Between Given Encodings","stri_escape_unicode: Escape Unicode Code Points","stri_extract: Extract Occurrences of a Pattern","stri_extract_boundaries: Extract Data Between Text Boundaries","stri_flatten: Flatten a String","stri_info: Query Default Settings for stringi","stri_isempty: Determine if a String is of Length Zero","stri_join: Concatenate Character Vectors","stri_join_list: Concatenate Strings in a List","stri_length: Count the Number of Code Points","stri_list2matrix: Convert a List to a Character Matrix","stri_locale_info: Query Given Locale","stri_locale_list: List Available Locales","stri_locale_set: Set or Get Default Locale in stringi","stri_locate: Locate Occurrences of a Pattern","stri_locate_boundaries: Locate Text Boundaries","stri_match: Extract Regex Pattern Matches, Together with Capture Groups","stri_na2empty: Replace NAs with Empty Strings","stri_numbytes: Count the Number of Bytes","stri_opts_brkiter: Generate a List with BreakIterator Settings","stri_opts_collator: Generate a List with Collator Settings","stri_opts_fixed: Generate a List with Fixed Pattern Search Engine\u2019s Settings","stri_opts_regex: Generate a List with Regex Matcher Settings","stri_order: Ordering Permutation","stri_pad: Pad 
(Center/Left/Right Align) a String","stri_rand_lipsum: A Lorem Ipsum Generator","stri_rand_shuffle: Randomly Shuffle Code Points in Each String","stri_rand_strings: Generate Random Strings","stri_read_lines: Read Text Lines from a Text File","stri_read_raw: Read Text File as Raw","stri_remove_empty: Remove All Empty Strings from a Character Vector","stri_replace: Replace Occurrences of a Pattern","stri_replace_na: Replace Missing Values in a Character Vector","stri_reverse: Reverse Each String","stri_sort: Sorting","stri_sort_key: Sort Keys","stri_split: Split a String By Pattern Matches","stri_split_boundaries: Split a String at Text Boundaries","stri_split_lines: Split a String Into Text Lines","stri_startsendswith: Determine if the Start or End of a String Matches a Pattern","stri_stats_general: General Statistics for a Character Vector","stri_stats_latex: Statistics for a Character Vector Containing LaTeX Commands","stri_sub: Extract a Substring From or Replace a Substring In a Character Vector","stri_sub_all: Extract or Replace Multiple Substrings","stri_subset: Select Elements that Match a Given Pattern","stri_timezone_info: Query a Given Time Zone","stri_timezone_list: List Available Time Zone Identifiers","stri_timezone_set: Set or Get Default Time Zone in stringi","stri_trans_casemap: Transform Strings with Case Mapping","stri_trans_char: Translate Characters","stri_trans_general: General Text Transforms, Including Transliteration","stri_trans_list: List Available Text Transforms and Transliterators","stri_trans_nf: Perform or Check For Unicode Normalization","stri_trim: Trim Characters from the Left and/or Right Side of a String","stri_unescape_unicode: Un-escape All Escape Sequences","stri_unique: Extract Unique Elements","stri_width: Determine the Width of Code Points","stri_wrap: Word Wrap Text to Format Paragraphs","stri_write_lines: Write Text Lines to a Text 
File"],titleterms:{"2013":2,"2014":2,"2015":2,"2016":2,"2017":2,"2018":2,"2019":2,"2020":2,"2021":2,"byte":[11,62],"case":92,"class":9,"default":[6,39,49,57,91],"function":[4,6,12],"new":2,For:96,Into:82,NAs:[4,61],THE:[0,13],about_argu:4,about_encod:5,about_local:6,about_search:7,about_search_boundari:8,about_search_charclass:9,about_search_col:10,about_search_fix:11,about_search_regex:12,about_stringi:13,align:68,all:[74,98],also:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],analysi:8,argument:[4,14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101,102],arithmet:20,ascii:[34,40],attribut:4,author:13,avail:[13,56,90,95],awar:10,between:[44,47],binari:[9,16],boundari:[8,19,47,59,81],breakiter:63,build:1,captur:60,categori:9,center:68,charact:[5,9,12,14,30,31,33,37,39,51,54,74,76,84,85,86,93,97],check:[34,35,36,96],code:[45,53,70,100],coercion:4,collat:[15,17,64],command:85,compar:[11,15,17],concaten:[14,51,52],conclus:1,contain:85,convers:5,convert:[24,32,40,41,42,43,44,54],count:[18,19,53,62],cran:2,creat:21,current:25,customis:1,data:[26,34,35,36,47],date:[20,21,22,23,25,26],declar:38,deprec:31,descript:[4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],detail:[5,6,7,8,9,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,5
3,54,55,56,57,58,59,60,62,63,64,65,66,67,68,69,70,71,72,73,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101,102],detect:[5,27,30,31],determin:[29,50,83,100],devel:2,duplic:[28,29],each:[38,70,77],element:[29,88,99],empti:[61,74],encod:[5,31,33,37,38,39,41,44],end:83,engin:[10,65],escap:[45,98],exampl:[14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,34,36,45,46,47,48,50,51,52,53,54,55,57,58,59,60,61,62,64,65,66,67,68,69,70,71,74,75,76,77,78,79,80,81,83,84,85,86,87,88,89,90,91,92,93,94,96,97,98,99,100,101],express:12,extract:[46,47,60,86,87,99],facil:13,field:22,file:[72,73,102],fix:[11,65],flatten:48,format:[16,23,24,26,101],from:[32,72,74,86,97],gener:[9,63,64,65,66,69,71,84,94],get:[22,25,38,39,57,91],given:[44,55,88,89],glanc:12,group:60,handl:4,icu4c:1,icu:12,identifi:[6,90],includ:94,input:4,insensit:11,instal:1,introduct:1,ipsum:69,kei:79,known:37,languag:30,latex:85,left:[68,97],length:50,line:[72,82,102],list:[26,37,52,54,56,63,64,65,66,90,95],local:[6,10,11,31,55,56,57],localiz:26,locat:[58,59],lorem:69,map:92,match:[11,18,27,60,80,83,88],matcher:66,matrix:54,meta:12,miss:[4,76],multipl:87,nativ:41,normal:96,note:6,number:[18,19,53,62],object:[4,21],occurr:[46,58,75],oper:[12,16],operator_add:14,operator_compar:15,operator_dollar:16,order:67,packag:[0,3,13],pad:68,paragraph:101,pars:23,pass:4,pattern:[9,11,18,27,46,58,60,65,75,80,83,88],perform:96,permut:67,point:[45,53,70,100],posix:9,possibl:[34,35,36],preserv:4,process:[0,1,13],properti:9,queri:[33,49,55,89],random:71,randomli:70,raw:73,read:[72,73],refer:[3,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,78,79,82,90,91,92,94,95,96,99,100,101],regex:[12,60,66],regular:12,remov:74,replac:[61,75,76,86,87],revers:77,right:[68,97],search:[7,10,65],see:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,78,79,80,81,82,83,84,
85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],select:88,sensit:[6,10,31],sequenc:98,set:[30,39,49,57,63,64,65,66,91],shuffl:70,side:97,sort:[78,79],split:[80,81,82],sprintf:16,start:83,statist:[84,85],stream:[34,35,36],stri_compar:17,stri_count:18,stri_count_boundari:19,stri_datetime_add:20,stri_datetime_cr:21,stri_datetime_field:22,stri_datetime_format:23,stri_datetime_fstr:24,stri_datetime_now:25,stri_datetime_symbol:26,stri_detect:27,stri_dup:28,stri_dupl:29,stri_enc_detect2:31,stri_enc_detect:30,stri_enc_fromutf32:32,stri_enc_info:33,stri_enc_isascii:34,stri_enc_isutf16:35,stri_enc_isutf8:36,stri_enc_list:37,stri_enc_mark:38,stri_enc_set:39,stri_enc_toascii:40,stri_enc_ton:41,stri_enc_toutf32:42,stri_enc_toutf8:43,stri_encod:44,stri_escape_unicod:45,stri_extract:46,stri_extract_boundari:47,stri_flatten:48,stri_info:49,stri_isempti:50,stri_join:51,stri_join_list:52,stri_length:53,stri_list2matrix:54,stri_loc:58,stri_locale_info:55,stri_locale_list:56,stri_locale_set:57,stri_locate_boundari:59,stri_match:60,stri_na2empti:61,stri_numbyt:62,stri_opts_brkit:63,stri_opts_col:64,stri_opts_fix:65,stri_opts_regex:66,stri_ord:67,stri_pad:68,stri_rand_lipsum:69,stri_rand_shuffl:70,stri_rand_str:71,stri_read_lin:72,stri_read_raw:73,stri_remove_empti:74,stri_replac:75,stri_replace_na:76,stri_revers:77,stri_sort:78,stri_sort_kei:79,stri_split:80,stri_split_boundari:81,stri_split_lin:82,stri_startsendswith:83,stri_stats_gener:84,stri_stats_latex:85,stri_sub:86,stri_sub_al:87,stri_subset:88,stri_timezone_info:89,stri_timezone_list:90,stri_timezone_set:91,stri_trans_casemap:92,stri_trans_char:93,stri_trans_gener:94,stri_trans_list:95,stri_trans_nf:96,stri_trim:97,stri_unescape_unicod:98,stri_uniqu:99,stri_width:100,stri_wrap:101,stri_write_lin:102,string:[0,7,10,13,15,17,24,28,38,41,42,43,44,48,50,52,61,68,70,71,74,77,80,81,82,83,92,97],stringi:[0,1,2,3,4,5,6,8,9,10,11,12,39,49,57,91],strptime:24,style:[16,24],substr:[86,87],support:1,text:[8,10,19,47,59,72,73,81,82,
94,95,101,102],time:[20,21,22,23,25,26,89,90,91],togeth:60,transform:[92,94,95],translat:93,transliter:[94,95],trim:97,two:14,unicod:[9,45,96],unicodeset:9,uniqu:99,usag:[14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],utf:[5,32,35,36,42,43],valu:[4,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102],vector:[4,14,51,74,76,84,85,86],what:2,width:100,without:[15,17],word:101,wrap:101,write:102,zero:50,zone:[89,90,91]}}) \ No newline at end of file +Search.setIndex({docnames:["index","install","news","rapi","rapi/about_arguments","rapi/about_encoding","rapi/about_locale","rapi/about_search","rapi/about_search_boundaries","rapi/about_search_charclass","rapi/about_search_coll","rapi/about_search_fixed","rapi/about_search_regex","rapi/about_stringi","rapi/operator_add","rapi/operator_compare","rapi/operator_dollar","rapi/stri_compare","rapi/stri_count","rapi/stri_count_boundaries","rapi/stri_datetime_add","rapi/stri_datetime_create","rapi/stri_datetime_fields","rapi/stri_datetime_format","rapi/stri_datetime_fstr","rapi/stri_datetime_now","rapi/stri_datetime_symbols","rapi/stri_detect","rapi/stri_dup","rapi/stri_duplicated","rapi/stri_enc_detect","rapi/stri_enc_detect2","rapi/stri_enc_fromutf32","rapi/stri_enc_info","rapi/stri_enc_isascii","rapi/stri_enc_isutf16","rapi/stri_enc_isutf8","rapi/stri_enc_list","rapi/stri_enc_mark","rapi/stri_enc_set","rapi/stri_enc_toascii","rapi/stri_enc_tonative","rapi/stri_enc_toutf32","rapi/stri_enc_toutf8","rapi/stri_encode","rapi/stri_escape_unicode","rapi/stri_extract","rapi/stri_extract_boundaries","ra
pi/stri_flatten","rapi/stri_info","rapi/stri_isempty","rapi/stri_join","rapi/stri_join_list","rapi/stri_length","rapi/stri_list2matrix","rapi/stri_locale_info","rapi/stri_locale_list","rapi/stri_locale_set","rapi/stri_locate","rapi/stri_locate_boundaries","rapi/stri_match","rapi/stri_na2empty","rapi/stri_numbytes","rapi/stri_opts_brkiter","rapi/stri_opts_collator","rapi/stri_opts_fixed","rapi/stri_opts_regex","rapi/stri_order","rapi/stri_pad","rapi/stri_rand_lipsum","rapi/stri_rand_shuffle","rapi/stri_rand_strings","rapi/stri_rank","rapi/stri_read_lines","rapi/stri_read_raw","rapi/stri_remove_empty","rapi/stri_replace","rapi/stri_replace_na","rapi/stri_reverse","rapi/stri_sort","rapi/stri_sort_key","rapi/stri_split","rapi/stri_split_boundaries","rapi/stri_split_lines","rapi/stri_startsendswith","rapi/stri_stats_general","rapi/stri_stats_latex","rapi/stri_sub","rapi/stri_sub_all","rapi/stri_subset","rapi/stri_timezone_info","rapi/stri_timezone_list","rapi/stri_timezone_set","rapi/stri_trans_casemap","rapi/stri_trans_char","rapi/stri_trans_general","rapi/stri_trans_list","rapi/stri_trans_nf","rapi/stri_trim","rapi/stri_unescape_unicode","rapi/stri_unique","rapi/stri_width","rapi/stri_wrap","rapi/stri_write_lines"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["index.rst","install.rst","news.rst","rapi.rst","rapi/about_arguments.rst","rapi/about_encoding.rst","rapi/about_locale.rst","rapi/about_search.rst","rapi/about_search_boundaries.rst","rapi/about_search_charclass.rst","rapi/about_search_coll.rst","rapi/about_search_fixed.rst","rapi/about_search_regex.rst","rapi/about_stringi.rst","rapi/operator_add.rst","rapi/operator_compare.rst","rapi/operator_dollar.rst","rapi/stri_compare.rst","rapi/stri_count.rst","rapi/stri_count_boundari
es.rst","rapi/stri_datetime_add.rst","rapi/stri_datetime_create.rst","rapi/stri_datetime_fields.rst","rapi/stri_datetime_format.rst","rapi/stri_datetime_fstr.rst","rapi/stri_datetime_now.rst","rapi/stri_datetime_symbols.rst","rapi/stri_detect.rst","rapi/stri_dup.rst","rapi/stri_duplicated.rst","rapi/stri_enc_detect.rst","rapi/stri_enc_detect2.rst","rapi/stri_enc_fromutf32.rst","rapi/stri_enc_info.rst","rapi/stri_enc_isascii.rst","rapi/stri_enc_isutf16.rst","rapi/stri_enc_isutf8.rst","rapi/stri_enc_list.rst","rapi/stri_enc_mark.rst","rapi/stri_enc_set.rst","rapi/stri_enc_toascii.rst","rapi/stri_enc_tonative.rst","rapi/stri_enc_toutf32.rst","rapi/stri_enc_toutf8.rst","rapi/stri_encode.rst","rapi/stri_escape_unicode.rst","rapi/stri_extract.rst","rapi/stri_extract_boundaries.rst","rapi/stri_flatten.rst","rapi/stri_info.rst","rapi/stri_isempty.rst","rapi/stri_join.rst","rapi/stri_join_list.rst","rapi/stri_length.rst","rapi/stri_list2matrix.rst","rapi/stri_locale_info.rst","rapi/stri_locale_list.rst","rapi/stri_locale_set.rst","rapi/stri_locate.rst","rapi/stri_locate_boundaries.rst","rapi/stri_match.rst","rapi/stri_na2empty.rst","rapi/stri_numbytes.rst","rapi/stri_opts_brkiter.rst","rapi/stri_opts_collator.rst","rapi/stri_opts_fixed.rst","rapi/stri_opts_regex.rst","rapi/stri_order.rst","rapi/stri_pad.rst","rapi/stri_rand_lipsum.rst","rapi/stri_rand_shuffle.rst","rapi/stri_rand_strings.rst","rapi/stri_rank.rst","rapi/stri_read_lines.rst","rapi/stri_read_raw.rst","rapi/stri_remove_empty.rst","rapi/stri_replace.rst","rapi/stri_replace_na.rst","rapi/stri_reverse.rst","rapi/stri_sort.rst","rapi/stri_sort_key.rst","rapi/stri_split.rst","rapi/stri_split_boundaries.rst","rapi/stri_split_lines.rst","rapi/stri_startsendswith.rst","rapi/stri_stats_general.rst","rapi/stri_stats_latex.rst","rapi/stri_sub.rst","rapi/stri_sub_all.rst","rapi/stri_subset.rst","rapi/stri_timezone_info.rst","rapi/stri_timezone_list.rst","rapi/stri_timezone_set.rst","rapi/stri_trans_casemap.rst","rapi/stri_t
rans_char.rst","rapi/stri_trans_general.rst","rapi/stri_trans_list.rst","rapi/stri_trans_nf.rst","rapi/stri_trim.rst","rapi/stri_unescape_unicode.rst","rapi/stri_unique.rst","rapi/stri_width.rst","rapi/stri_wrap.rst","rapi/stri_write_lines.rst"],objects:{},objnames:{},objtypes:{},terms:{"0000":[5,9],"000a":66,"001a":44,"00ad":101,"0100":23,"0105":9,"0123456789":70,"032":40,"0377":12,"0530":23,"075258":23,"0800":23,"0ooo":12,"0x0a":83,"0x0b":83,"0x0c":83,"0x0d":83,"0x1a":40,"0x1f":99,"0x2028":83,"0x2029":83,"0x3000":101,"0x85":83,"0xff01":101,"0xff5e":101,"100":[2,64,67,72,79],"100000":30,"101":[67,72,79],"102":2,"105":2,"106":2,"10646":13,"107":2,"108":2,"109":2,"10ffff":[5,9],"110":2,"111":2,"1119":102,"112":2,"114":2,"116":2,"117":2,"118":2,"1184":102,"119":2,"120":2,"122":2,"123":[2,14,18,27,47,50,51,52,53,62,76,78,82,89,93,94],"1234":76,"124":2,"1250":[30,36],"1251":30,"1252":[2,5,30],"1253":30,"1254":30,"1255":30,"1256":30,"126":2,"127":[5,34,38,40,43],"128":2,"129":2,"12l":21,"132":2,"133":2,"134":2,"135":2,"137":2,"138":2,"139":2,"141":2,"143":2,"144":2,"149":2,"154":2,"157":2,"164":2,"165":2,"168":2,"169":2,"16be":[30,31,35],"16le":[30,31,35],"170":2,"174":2,"175":2,"176":2,"177":5,"180":2,"183":2,"187":2,"188":2,"189":23,"190":69,"193":2,"1970":25,"1981":102,"199":2,"1990":9,"1996":23,"1999":[10,23],"1bc":[21,22],"1st":23,"1to1":33,"2001":2,"2002":12,"200b":101,"2013":0,"2014":[0,20],"2015":[0,21,23],"2016":[0,20],"2017":0,"2018":0,"2019":0,"2020":0,"2021":0,"2022":30,"2028":[9,83],"2029":[9,83],"205":2,"2060":9,"206f":9,"207":2,"210":2,"214":2,"216":2,"219":2,"220":2,"227":2,"230":2,"231":2,"232":2,"235":23,"2350":23,"238":2,"242":2,"2451334":23,"253":2,"254":2,"258":2,"263":2,"266":2,"267":2,"270":2,"285":2,"288":2,"289":2,"296":2,"2bc":[21,22],"2nd":23,"314":2,"3166":[6,91],"317":2,"318":2,"319":2,"31t23":23,"325":2,"32be":[30,31,35],"32le":[30,31,35],"334":2,"335":2,"337":2,"338":2,"341":2,"343":2,"344":2,"345":2,"3456":[87,88],"347":2,"348":2,"355":2,"
362":2,"3629":13,"363":2,"364":2,"366":2,"369":2,"370":2,"372":2,"382":2,"386":2,"393":2,"398":2,"399":2,"3rd":2,"400":2,"401":2,"405":2,"408":2,"414":2,"415":2,"421":2,"456":[27,52,76,82],"4601":23,"5198":97,"55200":46,"5775":21,"61201235":23,"639":6,"667":[87,88],"789":[27,52,76,82,87,88],"822":23,"8601":23,"8859":[5,30],"8bit":33,"9899":9,"999":21,"abstract":12,"bart\u0142omiej":0,"break":[2,8,19,47,59,63,82,93,102],"byte":[0,2,3,5,7,12,13,30,31,32,33,34,35,36,38,40,41,42,43,44,53,66,80,87,99],"case":[0,1,2,3,4,5,6,7,8,9,10,11,12,13,17,19,24,27,30,31,43,44,46,47,51,53,55,59,63,64,65,66,70,76,81,82,88,95,97,102],"char":85,"class":[0,2,3,7,8,12,13,20,21,22,23,25,26,64,71,91,92,98],"default":[0,1,2,3,5,12,15,17,18,19,20,21,22,23,26,27,29,31,33,37,38,43,44,46,47,55,58,59,60,63,64,65,66,67,68,72,73,76,79,80,81,82,83,84,89,90,91,93,98,100,102,103],"enum":[2,66],"export":2,"final":[5,6,9,12,101],"float":2,"function":[0,1,2,3,5,9,10,11,13,15,17,18,19,20,23,24,27,29,30,31,32,34,35,36,38,40,41,42,43,44,46,47,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,72,73,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,95,97,98,99,100,101,102,103],"import":[2,4],"long":[1,2,4,23,90,91],"new":[0,12,14,82,102],"null":[1,2,6,17,18,19,20,21,22,23,26,27,29,31,32,33,39,41,42,44,46,47,51,52,55,57,58,59,60,63,64,67,72,73,76,79,80,81,82,84,89,90,92,93,100,102,103],"public":9,"return":[2,5,7,12,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,68,69,70,71,73,74,75,76,77,78,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],"short":[1,2,9,11,23,49,90],"static":2,"strin\u0261i":0,"switch":[2,5],"throw":2,"true":[2,5,9,12,17,19,21,23,27,29,37,43,44,46,47,48,49,51,52,54,58,59,64,65,66,67,68,69,71,72,75,76,79,81,82,83,87,88,89,102],"try":[1,2,31],"var":1,"while":[2,5,6,8,17,39],Added:2,For:[0,1,3,4,5,6,8,9,10,12,17,19,23,24,30,32,36,37,43,44,45,46,47,53,58,59,60,
62,63,66,67,72,76,79,80,82,84,87,88,90,92,93,95,98,99],Into:[0,3],Its:[12,36,87,88],Los:23,Mrs:[59,82],NAs:[0,3],NFs:97,Not:[30,46,57,62,76,87,92],One:6,Such:[5,29,87,88,100],Sys:[5,38,39],THE:[3,47,81],The:[0,1,2,5,6,7,8,9,10,11,12,13,17,19,20,23,25,27,30,31,34,36,37,41,48,54,58,59,60,62,63,67,69,72,73,76,79,80,81,82,89,91,97,99,101,102],Their:[6,12],There:5,These:[5,7,8,9,14,15,17,18,19,23,27,35,44,46,47,51,52,58,59,60,68,76,81,83,84,89,93,97,98],Use:[2,58,59],Used:90,Useful:2,Uses:99,Using:2,With:[12,55,93],_boundari:[2,7,59],_charclass:[2,7,9,84],_coll:[2,7,10,84],_count:2,_euro:6,_fix:[2,7,65,84],_limit:2,_regex:[2,7,12,58,60,76],_static:2,_word:[47,59],_xpg6:2,a_b_c__d:81,a_b_c_d:81,aaa:[23,46,58,98],aaaa:[46,58,76],aaaaaaaa:[46,58],aabbcc:[46,58],ab_c:81,aba:46,ababa:84,abababa:46,abaca:76,abbrevi:[23,26],abc:[9,14,27,28,46,50,51,53,58,62,78,87,88,93],abcd:[60,68],abcdefghi:70,abcdefghijk:[46,58],abil:[73,80,103],abl:[2,7],about:[0,2],about_argu:[0,3,5,6,7,8,9,10,11,12,13],about_encod:[0,3,4,6,7,8,9,10,11,12,13,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44],about_local:[0,3,4,5,7,8,9,10,11,12,13,15,17,19,29,31,47,55,56,57,59,64,67,72,79,80,82,93,100,102],about_search:[0,3,4,5,6,8,9,10,11,12,13,18,19,27,46,47,58,59,60,63,64,65,66,76,81,82,83,84,89,93,98,102],about_search_boundari:[0,3,4,5,6,7,9,10,11,12,13,15,17,19,29,31,47,59,63,64,67,72,79,80,82,83,93,100,102],about_search_charclass:[0,3,4,5,6,7,8,10,11,12,13,98],about_search_col:[0,3,4,5,6,7,8,9,11,12,13,15,17,19,29,31,47,59,64,67,72,79,80,82,93,100,102],about_search_fix:[0,3,4,5,6,7,8,9,10,12,13,65],about_search_regex:[0,3,4,5,6,7,8,9,10,11,13,66],about_stringi:[0,3,4,5,6,7,8,9,10,11,12],abov:[9,31,54,60,64],absolut:1,ac_config_fil:2,ac_subst:2,acagagactttagatagagaaga:[58,60],accent:[9,10,11,95],accept:[2,63,89],access:[1,2,9,16,42],accompani:13,accord:[9,38,44,46,62,64,72,79,81,93],accordingli:2,account:[8,10,17,30,65,68,90,102],acd:9,acgt:[60,94],achiev:95,across:2,act:[2,14,35,63,68,102],action:63,activ:
[5,9,62,97],actual:[11,102],add:[2,20,44,68],added:[2,68],adding:20,addit:[1,2,17,18,19,23,27,29,46,47,58,59,60,67,72,76,79,80,81,82,84,89,91,93,100],addition:[2,5,13,17,37,38,60],address:2,adipis:[18,76,85,86,87,102],adjac:23,adjust:98,advanc:[4,9,12,63],aesthet:102,affect:[2,81,82,95],after:[2,12,30,64],aga:[46,58,76],agaga:[46,58,76],again:[2,9],against:[1,2,30],aggreg:[85,86],agonek:78,ahead:12,aim:[2,9,19,44,73],ala:[65,66],algorithm:[2,9,10,11,13,67,79,80,86,97,102],alia:[2,17,29,44,54,64,66,69,73,74,75,76,87,88,102,103],alias:[2,9,37,51,52],align:[0,3],alik:64,aliquet:[85,102],all:[0,1,2,3,4,5,6,7,9,10,12,13,15,17,18,19,22,23,26,27,28,29,30,31,33,34,36,38,40,43,44,45,46,47,52,56,57,58,59,60,61,64,76,81,82,91,92,97,98,102,103],alloc:2,allow:[2,5,9,10,12,17,18,21,27,32,46,58,60,66,87,102],almost:[4,5,91],alon:23,along:30,alpha:27,alphabet:[9,12],alphanumer:5,alreadi:[1,29,92],also:[0,1,2,68,78],alter:12,altern:[2,9,12,58,80,87],alternate_shift:64,alwai:[5,9,17,31,39,40,44,51,54,56,57,71,73,89,91,97,102],ambigu:5,america:23,amet:[18,52,69,76,81,85,86,87,102],among:[0,2,5,9,13,60,68],amount:[5,20,30,91],ampm:[22,26],analog:95,analysi:[0,2,3,7,12,13,19,47,59,63,82,102],angel:23,angl:[12,30],ani:[0,2,4,5,6,9,12,13,17,23,29,32,43,45,51,55,63,64,65,66,76,83,87,88,90,95,97,101],annex:[9,97,101],anno:23,anoth:[9,95],anydupl:29,anymor:2,anyth:[55,87],anywai:[1,2],apart:[5,37],api:[0,2,9,13,24,26,32,38,63,64,66,91,92],apidoc:[9,13,26,63,64,66,91,92],appear:[5,6,12,23,63,71,81,83,85,86],append:23,appli:[4,9,12,14,81,83,88,91,101,102],applic:[2,5,87,88],appreci:0,appropri:[1,8,44,46,64,81],approxim:[2,13,101],arab:30,arbitrari:[32,84,98],architectur:64,archiv:1,area:91,arg:[1,2],argument:[0,1,2,3,5,6,13],aris:97,arithmet:[0,3],arrai:2,arrang:102,asan:2,ascend:67,ascii:[0,2,3,5,9,12,23,31,33,36,38,39,43,44,45,66,71,95,99,101,102],ascii_hex_digit:9,asian:101,ask:6,assert:12,assum:[1,2,4,5,38,39,40,43,44,97],assumpt:[5,38,40],asymmetr:9,atom:[2,4,12,16,51,54],atomic_vector:16
,attempt:2,attr:22,attrib:2,attribut:[2,37,64,100],augu:[85,86,102],australian:6,author:0,auto:2,autoconf:2,autom:5,automat:[5,6,9,38,44,97],avail:[0,2,3,6,7,9,12,37,46,65,66,76,90,95],avoid:[2,6,9,97],awar:[6,11,12,13,27,64,80],baaab:18,baab:18,bab:18,babaab:94,babab:18,back:[6,9,12,23,87],backslash:[9,66,76],backtrack:66,backward:[2,64],bacon:[19,52,59,60,82],bartek:13,bartolini:[46,58],base:[1,2,5,7,9,10,13,15,16,21,22,24,29,31,59,64,69,72,84,87,88,95,100,101,102],basic:[2,5,8,23,33,54,55,90],bastienfr:2,bbbbb:58,bear:76,becam:2,becaus:[1,2,4,6,11,14,30,31,36,44,65,73,97],becom:[1,23,81,103],been:[0,1,2,5,9,30,53,63,84,92],befor:[2,9,12,30,45,64,90,102],begin:[12,13,67,79,86,91],behavior:[4,6,8,12,43,51,63,64,65,66,67,79,91],behaviour:2,behind:[2,12],being:[2,5,12,23,55,64,87,102],bell:12,belong:9,below:[2,4,5,8,9,12,17,23,33,46,58,64,67,76,79,85],best:[5,6,30,31],better:[5,12,29,65,70,100],between:[0,2,3,5,9,10,12,17,24,48,59,64,81,98,102],bewar:99,biarch:2,bibliograph:9,bidi:9,bidi_control:9,bidi_mirror:9,bidirect:[9,70,71,78,87],big5:30,big:[1,2,71],bin:[1,2],binari:[0,2,3,7,14,18,73,74,85,98,103],bit:[5,31,32,33,36,39,40,42,43,62,91],bitcoin:98,bitwis:11,black:76,bogu:43,bom:[2,5,17,43,44],both:[2,5,17,19,20,35,43,68,75,87,98,102],bound:[9,87],boundari:[0,2,3,7,12,13,63,66,81,93,102],boundaryanalysi:[8,63],box:[1,2],bracket:[9,12,30],breakfast:60,breakiter:[0,2,3,8,19,47,59,82,93,102],briefli:9,bring:2,british:2,broader:95,broken:2,brown:[59,76,82],bsd:[0,2,13],buddhist:26,buffer:2,bug:[0,1,2],bugfix:2,build:[0,2],built:[1,2,49,51,54,95],bundl:[1,2],by_row:54,byrow:[2,46,47,54,81,82],bytewis:[29,64,100],c90:9,calendar:[2,6,20,21,22,23,26,90],call:[0,1,2,4,5,6,11,14,15,17,18,19,27,30,41,42,43,44,46,47,48,55,57,58,59,60,73,76,81,82,84,88,89,91,95,102],cam:101,can:[0,1,2,5,8,9,30,32,38,41,43,44,70,74,88,93,95,98,102],canadian:64,cannot:[2,8,44,73,99],canon:[2,10,15,17,29,33,37,97,100],capabl:95,capit:[8,93],captur:[0,2,3,12,46,76],care:[4,87],carefulli:5,carriag
:[12,83],cascad:5,case_ignor:9,case_insensit:[2,27,46,58,65,66,76],case_level:[17,64],case_map:65,case_sensit:9,casemap:93,cat:[1,5,68,69,101,102],categori:[5,7,12,18,38,39,63,98,101],caus:[2,9,43,64],cbind:[87,88],ccc:23,cccc:23,ccccc:23,cccccc:23,center:[0,3],cento:[1,2],central:5,certain:[23,45],certainli:36,cflag:1,cg_miss:[2,60],chain:[2,69,95],chang:[2,5,6,9,12,30,39,42,57,66,68,87,91,92,93,102],changes_when_casefold:9,changes_when_casemap:9,changes_when_lowercas:9,changes_when_nfkc_casefold:9,changes_when_titlecas:9,changes_when_uppercas:9,charact:[0,2,3,4,6,7,8,13,15,16,17,18,19,23,24,27,28,29,32,34,35,36,38,40,41,42,43,44,45,46,47,48,49,50,52,53,55,56,58,59,60,61,62,63,67,68,69,70,71,72,73,76,78,79,80,81,82,83,84,88,89,91,93,95,96,97,99,100,101,102,103],character_set:30,charclass:[2,9,18,27,46,58,71,76,81,84,85,89,98,101],charmod:97,charscmdenvir:86,charset:[39,49],charsiz:33,charsnwhit:85,charswhit:86,charsword:86,charsxp:2,chartr:2,check:[0,1,2,3,5,6,9,17,30,31,38,46,64,68,84],chines:[8,9,23,30],chladni:[17,67,72,79,80],choic:[5,23],choos:1,chunk:7,circul:6,circumst:24,citi:23,civil:6,cjkv:9,clang:2,clariti:9,classicu_1_1col:64,classicu_1_1dateformatsymbol:26,classicu_1_1timezon:[91,92],classicu_1_1unicodeset:9,classif:9,classifi:35,claus:[0,2,13],cldr:2,clean:2,clever:[17,44],clock:[22,23],close:[1,9],closer:91,cluster:12,cmd:[1,86],code:[0,2,3,5,6,8,9,12,13,15,17,19,31,32,33,40,42,43,44,59,62,64,65,68,71,78,84,85,87,91,93,94,100,102],codec:2,codepoint:97,coerc:[2,37,48,54,67,79],coercibl:[4,14,15,17,19,20,22,23,32,38,42,47,50,51,53,59,62,77,82,101],coercion:2,coexist:5,coll:[18,27,46,58,64,65,76,81,84,89],collaps:[2,4,30,48,51,52,69,70],collat:[0,2,3,6,7,10,13,29,67,72,79,80,100],collect:2,colour:1,column:[2,22,54,58,59,60,67,87,88,101],com:[1,2,13],combin:[9,12,55,95,97],come:[8,93],command:[0,1,3],comment:[12,66],common:[1,2,40,90],commonli:[9,30],commun:[5,6],compar:[0,3,5,6,12,13,29,60,62,76],comparison:[2,5,6,15,17,64,67,79],compat:[2,23,97,101,102
],competit:5,compil:[1,2],complement:9,complex:[1,5,10,11,64,94,102],complic:55,compon:[13,26,31,33,49,90],composit:[95,97],compound:95,comprehens:[2,9],comput:[5,6,22,62,80],con:[2,73,74,103],concaten:[0,2,3,5,13,28],concept:6,concern:91,concis:49,conclus:0,condition:2,confid:[30,31],config:[1,2],configur:[1,2,30,87],conform:[2,12,73],confus:51,conjoin:[10,11],conjunct:2,connect:[2,9,54,73,74,103],connector_punctu:12,consectetur:[18,76,85,86,87,102],consecut:[27,46,58,76,102],consequ:[15,39],consid:[44,64],consider:5,consist:[0,2,4,5,9,13,17,24,40,47,52,60,68,69,71,93,94],consol:[5,53,68,102],conson:101,consortium:13,constant:[2,12,66],construct:[2,21],contain:[0,3,9,49,63,66,76,80,85,102],content:[13,83,97],context:[12,23,26,65,86,93],continu:9,contrari:[98,102],contribut:[0,13],contributor:86,control:[2,8,9,12,64,66,67,79,84,99,101],conveni:[0,2,13,18,27,32,46,57,58,60,63,64,65,66,68,76,77,81,84,89,95,98],convent:[6,19,45,47,59,93,102],convers:[2,11,13,24,30,44,74,95],convert:[0,2,3,4,5,9,23,31,37,45,95,97],converted_str:44,cooki:93,coordin:91,copi:[1,2,4,87,88,100],coptic:26,copyright:[2,13],correct:[0,2,6,10,11,13,87],correctli:[1,2,5,39],correspond:[2,4,9,15,17,27,32,34,36,42,51,53,60,72,76,83,87,88,91,94],cost:[2,102],cost_expon:102,could:[2,6,30],count:[0,2,3,7,8,13,23,84,86,87],counterpart:[29,100],countri:[6,55,91],cours:[2,4,30,31,84],cover:[5,12,31],cpp:[2,31],cppflag:1,cpu:66,cra:[85,102],cran:0,creat:[0,1,3,5,14,56],criteria:[2,67,72],crlf:83,csrucod:31,cstring:2,cultur:6,currenc:[6,9],current:[0,1,2,3,6,9,12,22,23,39,41,44,49,57,60,62,69,73,90,92,103],custom:[1,2,63],customis:0,cxx11:[1,2],cxx1x:2,cxxcpp:2,cxxflag:1,cyclic:23,cyril:[9,95],czech:30,czw:23,d_ef_g:81,dai:[20,21,22,23],danish:30,dash:[2,9],dat:2,data:[0,1,2,3,5,9,11,22,23,30,31,38,44,59,62,64,67,69,72,81,91,103],databas:[9,13],date:[0,2,3,13,24,91,92],date_long:23,dateformatsymbol:26,datetim:[20,21,22,23,24,25,26,90,91,92],datetime_relative_medium:23,davisvaughan:2,daylight:[23,90,91],day
ofweek:22,dayofyear:22,de_d:[17,93],deal:[2,4,5,42,53],debian:1,debug:2,decid:5,decim:[9,12],decimal_numb:12,declar:[0,2,3,5,39,40,41,43,44],decnumb:2,decod:[32,95],decomposit:97,decreas:[30,31,67,79],def:27,default_ignorable_code_point:9,default_local:2,defin:[9,10,12,32,39,49,64,81,83,84,87,88,91,97,99],definit:[64,66],delimit:81,deliv:6,denorm:5,denot:[5,9,22,48,76,84,87,102],depend:[1,2,5,6,8,9,12,15,17,18,22,23,27,29,46,57,58,66,67,72,76,79,80,81,83,84,89,92,93,100,102],deprec:[0,2,3,9,29,63,64,65,66,69,73,74,103],descend:67,describ:[9,10,11,12,54],design:[2,5,23,91,95],desir:[6,66,71,77,95],dessert:60,detail:4,detect:[0,2,3,6,7,13,35,38,39,42,53,60,65,74,85],determin:[0,2,3,5,9,13,17,19,27,30,40,81,83,92,97,102],dev:[1,2,9,13,26,63,64,66,91,92],devel:[0,1],develop:[1,5,13],diacrit:[8,9,17],diagnos:44,diagnost:2,did:[2,6],differ:[2,5,6,8,9,12,17,18,19,30,46,48,51,58,60,66,76,93,94,95,97,98],digit:[5,9,12,13,23,45,64,71,91,99],digraph:9,dim:4,dimitri:2,dir:[1,2],directli:[2,58,80,84],directori:1,disabl:[1,2,12],disallow:[9,44],disappear:9,discourag:9,discret:69,discuss:[5,39,44,55],disjoint:88,dispatch:68,displai:[2,5,8,9,23,69],display_typ:90,distinguish:12,distribut:[1,2,13,69],divers:1,doc:[9,10,13,26,63,64,66,91,92],document:[2,8,9,13,26,63,64,66,91,92,97],doe:[1,2,5,6,8,9,12,17,23,24,33,55,60,64,91,101,102],dog:76,doing:[4,5,39],dolor:[18,52,69,76,81,85,86,87,102],domini:23,done:[11,71],dot:9,dot_al:66,dotal:66,download:[0,1,2],draft:[0,2,13,97],drastic:2,draw:71,drop:4,dst:[90,91],dt_relative_styl:23,dt_style:23,du_disable_renam:2,dual:[32,42],due:[1,4,5,37],dummi:[2,69],duplic:[0,2,3,37,100],dure:[6,56,81,91],dutch:30,dynam:[2,102],dynlib:2,e0000:9,e0fff:9,each:[0,2,3,4,5,6,7,8,9,13,14,18,24,27,28,29,30,31,32,37,40,42,46,47,51,52,53,54,58,60,62,68,71,72,73,76,77,81,83,84,85,86,87,88,93,94,95,96,97,102,103],eagerli:2,earli:2,eas:2,easier:[5,89],easili:[2,42,103],east:101,eee:23,eeee:23,eeeee:23,eeeeee:23,effect:[39,57,91],effici:[2,4,10,12,43],efficient_te
xt_searching_in_java:10,egg:[19,59,60,82],eight:12,either:[1,5,9,12,18,23,24,27,44,45,46,63,81,84,89,91,93],element:[0,2,3,4,6,13,15,17,18,27,30,31,34,36,37,42,46,47,48,50,51,53,54,58,60,67,71,76,79,81,83,84,85,86,88,103],elit:[18,76,85,86,87,102],ellipsi:36,embed:44,emoji:[2,9,46],emoji_modifi:9,emoji_modifier_bas:9,emoji_present:9,emploi:9,empti:[0,2,3,4,6,9,12,18,27,31,46,47,48,50,51,81,82,83,84,87],emul:2,en_au:6,en_u:[6,57,59,82,93],enabl:[12,30,65,66],enc2utf8:[42,43],enc:[33,39],enclos:[9,23],encod:[0,2,3,9,13,30,32,34,35,36,40,42,43,49,53,62,73,74,80,89,97,103],encoding_convers:[5,32,40,41,42,43,44],encoding_detect:[5,30,31,34,35,36],encoding_manag:[5,33,37,38,39],encodingnam:44,encount:[5,12,39],encourag:[1,101],end:[0,2,3,7,8,9,12,13,27,30,32,46,57,58,59,62,63,66,67,76,79,83,86,87,88,91,92,98,102],endian:[1,2],engin:[0,2,3,7,9,11,12,13,18,27,30,46,58,60,76,81,84,89],english:[6,10,30],enhanc:80,entir:66,entireti:73,entri:[0,37,66],enumer:101,envir:86,environ:[1,2,41,86],equal:[17,23,29,30,31,51,52,64,68,71,81,82,100,101],equat:91,equip:2,equival:[2,5,9,10,15,16,17,19,29,38,42,48,51,59,64,65,66,76,77,80,83,89,97,100,101],era:[22,23,26],erron:44,error:[2,4,9,12,33,53,66,85,102],error_on_unknown_escap:66,escap:[0,3,12,13,23,66,76],especi:[1,5,10,30,87],essenti:97,establish:[2,4,57,64,92],eszett:93,etc:[1,2,4,5,12,21,22,26,42,46,63,81],etiam:[85,102],euc:30,euro:[2,6],europ:[90,92],european:[5,6],evalu:12,even:[5,8,12,23,30,54,55],evenli:102,ever:5,everi:[13,60,76,78,102],everyth:9,exact:[2,12],exactli:[5,12,17,32,33,38,42,68],examin:[5,27],exampl:[0,2,5,6,8,9,11,12],examplercppstringi:2,exce:[44,73],except:[2,9,12,23,102],exclud:[63,89],exclus:[87,88],exdent:[2,102],execut:[1,45],exemplar:23,exemplari:23,exercis:69,exist:[1,2,5,12],expand:2,expect:[1,4,6,9,66],experi:[1,102],expert:39,explain:[4,5,6,7],explicit:5,explicitli:[44,87],expon:102,express:[0,3,4,5,7,9,13,66,83,98],extend:[5,9,23,36,38,40,43],extens:2,extern:[2,5],extra:[1,64,94],extract:[0,2,3,7,12,
13,29,58,81,82],face:1,facil:[10,11,30,31,66,99],fact:[30,37],factor:4,fail:[1,2,5,6,12,30,31,39,41,43,62,66],failur:[2,12,30,31],fall:[9,23],fallback:1,fallback_encod:[2,73],fals:[2,5,21,23,27,29,30,35,36,37,43,44,46,47,48,49,51,54,58,59,60,63,64,65,67,68,69,75,76,79,81,82,83,84,87,88,89,102],famili:[2,31,37,63],familiar:2,fanci:[13,48],faq:5,fashion:[2,17],fast:[0,2,11,12,13],faster:[9,44,84,89],fastest:50,fcd:64,featur:[0,1,2,12,19,59,68,82,102],feature_test:2,februari:20,fedora:1,feed:[12,83],feel:[14,15,17,84],fetch:[1,90,91],few:[0,1,12,30,31],fewer:12,fff0:9,fffb:9,fffd:44,field:[0,2,3,23,81],file:[0,1,2,3,5,13,30,63,83,85,86],fill:[2,46,47,54,81,82],filter:[30,82],filter_angle_bracket:30,find:[1,4,8,9,50,58,67],first:[1,2,4,7,8,9,10,12,17,22,23,29,31,33,46,48,51,52,58,59,60,76,84,91,93,95,98,102],fit:[5,8,63],fix:[0,2,3,10,12,18,27,43,46,49,58,62,66,76,81,84,89],flag:[1,2,12,23,49,66],flatten:[0,3],flavor:[1,9],flavour:2,floor:[68,102],fname:[2,73,74,103],fold:[2,13,97],follow:[1,2,5,6,7,9,12,13,19,22,26,29,30,31,33,45,47,49,55,59,63,69,83,85,86,90,93,95,97,99,101,102],font:101,food:60,forc:[1,2,64],form:[5,6,9,12,16,23,24,36,40,42,49,55,57,60,64,76,83,87,97,99],formal:[97,101],format:[0,2,3,8,9,12,13,30,91,97],formatpars:[23,26],formatt:24,found:[29,40,44,46,58],four:5,fox:76,fraction:[21,23],fragment:12,frame:[2,22,30,31,67,72,91],free:12,freeli:9,french:[6,30,64],frequent:[2,30],friedl:12,friend:15,friendli:[2,5,33,39,87,88],from:[0,1,2,3,4,5,9,12,13,17,21,23,29,30,37,43,44,46,51,58,66,67,69,71,76,79,81,83,84,88,89,91,95,97],from_last:[2,29],fromlast:[2,29],front:87,full:[2,23,65,81,82,93,95,101],fulli:[0,31,60],fundament:6,further:[5,13],futur:[2,23,63,64,65,66,85,86],gaertner:17,gagolew:[1,2],gagolewski:[0,2,13],gain:2,garbag:2,gather:13,gb18030:30,gcing:2,gcmask:2,gcuacggagcuucggagcuag:94,gener:[0,1,2,3,4,7,8,12,13,18,23,27,32,39,40,42,44,46,53,61,70,80,84,87,88,93,96,97,98,101],general_categori:9,generic_loc:90,generic_long:90,generic_short:90,german:
[6,30,93],get:[0,1,2,3,4,5,6,33,45,51,52,53,55,58,59,64,75,85,95,98,102],getlocal:[5,38,39],getopt:[68,102],ggg:23,gggg:23,ggggg:23,ghi:27,github:[0,1,2,9,13,26,63,64,66,91,92],give:[0,2,5,11,12,13,23,29,37,38,49,57,58,59,60,67,68,70,71,77,78,80,81,82,84,85,86,87,88,94,102],given:[0,2,3,4,5,7,12,17,18,23,24,27,32,33,35,36,37,38,39,46,47,49,52,53,54,58,60,66,67,68,69,76,77,81,82,83,84,87,91,94,95,98,99,102,103],glanc:[9,10],glibc:2,gmt:[23,90,91],gmt_long:90,gmt_short:90,good:[12,46],graphem:[5,12],great:4,greater:[5,17,36,38,40,51,52,62,71,102],greatest:31,greatli:0,greedi:[2,102],greek:[9,30,95],greenwich:91,gregorian:[2,20,21,22,23,26,90],gro:[29,95,100],gross:[29,100],group:[0,2,3,5,6,12,30,46,76],gru:23,grudnia:23,guarante:[1,2],guess:[30,31],guid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],guidelin:[23,73,83],had:[2,5],hadlei:0,half:91,halfwidth:95,hand:[81,82],handl:[2,5,6,8,30,38,50,53,62,77,87,95,99],hangul:101,happi:[59,82],hard:63,has:[0,1,2,5,30,38,39,43,48,51,52,53,84,87,92],have:[1,2,5,6,8,9,12,23,29,31,33,39,44,54,63,68,101,102],hbox:2,he_il:26,heap:66,hebrew:[20,21,22,26,30],help:1,hemispher:91,henc:[29,100],here:[9,10,11,12,17,23,30,38,41,43,53,58,60,93],hesit:1,heurist:[30,31],hex:[12,45,95,99],hex_digit:9,hexadecim:9,hhhh:12,hhhhhhhh:12,higher:[30,31],hiragana:63,histor:91,hit:31,hladn:17,hladni:[17,67,72,79,80],hms:23,hold:[17,38],home:[2,13],homepag:[0,13],honour:2,hopefulli:1,horizont:[12,102],host:0,hour12:22,hour:[20,21,22,23,90,91],how:[2,4,5,6,7,9,10,12,13,17,55,67,72,79,80],howev:[1,2,5,6,9,14,30,35,36,44,54,55,62,76,95],html:[5,6,9,10,12,13,26,30,63,64,66,83,91,92],http:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,86,91,92,93,95,96,97,100,101],human:[6,90],hundr:[5,30,31],hungarian:30,hyphen:[9,101],i18n:[2,13,31],iana:33,ibm420:30,ibm424:30,ibm:[13,33],icecream:60,iconv:44,icu4c:[0,2,9,13,26,63,64,66,91,92],icu52dt:2,icu55:[1,2],icu61:2,icu:[0,1,2,5,6,7,8,9,10,13,17,19,20,23,24,
26,29,30,31,33,37,38,39,44,46,47,49,55,56,59,60,63,64,65,66,67,72,76,79,80,82,90,91,92,93,95,96,97,99,100,102],icudt52b:2,icudt61b:2,icudt61l:2,icudt:[1,2],icudt_dir:1,id456:89,id_:14,id_continu:9,id_start:9,ident:91,identifi:[0,2,3,9,19,20,21,22,23,26,31,33,37,47,55,56,59,90,92,93,95,96,102],ideograph:[9,63],iec:9,ietf:[13,97],ifels:103,iff:31,ignor:[2,5,6,9,10,11,12,17,19,23,25,30,44,47,51,52,59,64,71,81,87,91,94,97],ignore_nul:[2,51],ill:[32,40,42,99],imag:30,imbal:2,implement:[2,6,10,11,12,44,69,73,84,86,93],impli:36,implicit:[5,9,38],imprecis:[5,30,31],improp:6,improv:2,inc:13,incident:5,includ:[0,1,2,3,6,7,8,9,12,13,18,26,27,46,58,60,62,76,81,84,86,87,89,101],inclus:[9,87],incompat:2,inconsist:24,incorrect:[2,43,44,53],incorrectli:2,increas:79,increment:64,inde:36,indent:[2,102],independ:[2,7,13,15,17,34,35,36,76],index:[2,29,58,59,84,87,88],indian:26,indic:[2,7,15,17,29,31,34,36,44,46,47,49,58,59,60,82,87,88,100],individu:[2,6,13,42,46,81],influenti:1,info:[12,91],inform:[2,5,6,10,12,13,17,19,33,37,47,49,55,56,57,59,67,72,79,80,82,90,91,92],initi:[2,5,6,9,31,102],inject:87,input:[2,5,11,12,17,30,32,38,40,44,45,51,59,63,64,66,67,73,76,79,81,83,87,88,93,94,95,97,102],ins:73,insensit:[0,3,5,9,12,17,65,66],insert:2,insid:[12,23,66],insight:55,inspect:27,inspir:[0,12,31],instal:[0,2],instanc:[4,5,18,23,27,36,37,46,58,60,84,87,98],instead:[2,62,68,102],instruct:2,integ:[4,5,17,18,19,20,21,27,28,29,32,42,53,54,58,59,62,64,66,67,68,69,71,81,82,84,85,86,87,88,101,102],intellig:2,intens:2,interact:6,interchang:[91,97],interest:[4,13,27,84,89],interestingli:10,interfer:30,intern:[2,5,13,30,32,39,44,49,62,92],internation:13,internet:1,interoper:[5,97],interpret:[5,23,40,43],intersect:9,introduc:[2,97],introduct:[0,12],inttoutf8:32,intuit:[5,38,67,79],invalid:[2,43],invis:[39,57,92],ipa:0,ipsum:[0,2,3,18,52,76,81,85,86,87,102],is_unknown_8bit:[5,43],isalnum:9,ish:2,islam:[6,26],ismwx:12,iso8601:23,iso:[5,6,9,13,23,30,91],ispunct:9,issu:[1,2,4,13,42,44],italian:30,iter:[2,
4,8,9,19,47,59,63,82,93,102],its:[2,4,5,6,9,12,13,15,17,29,37,87,100],itself:[40,91],ja_jp_tradit:26,jamo:101,januari:[20,22],japanes:[8,9,26,30,95],java:[0,10,12,13,33],jdk:12,jkl:27,john:2,join:[14,28,48,51,52],jone:[59,82],joy:13,juli:23,julian:23,jump:76,just:[2,5,6,8,12,19,29,31,41,47,58,59,60,69,76,88,100],kana:63,katakana:[9,63,95],keep:58,kei:[0,2,3,5,64],keyboard:[5,38],keyword:[6,13,20,21,22,23],kile:86,kind:9,know:[4,5,39],knowledg:5,known:[0,2,3,5,31,45,56,66,99],knuth:[2,11,102],koi8:30,korean:[9,30],l10n:13,lacinia:[85,86,102],lai:69,languag:[0,2,3,5,6,7,8,11,13,17,29,31,55,57,64,65,93,95,100,102],language_countri:[6,55,57],language_country_vari:[6,57],lappli:91,larg:9,larger:[2,5],largest:12,last:[2,7,12,29,46,58,59,60,76,83,84,87,94,98,102],latest:1,latex:[0,3],latin1:[2,5,38,44],latin:[9,68,69,71,95,102],lazi:76,lc_ctype:[5,38,39],ldflag:[1,2],lead:[4,5,9,12,17],leak:2,leap:[25,91],least:[4,12,27,30,31,68,71,85],leav:[87,88],led:2,ledkov:2,left:[0,3,9,46,58,64,66,76,102],legal:9,legibl:30,length:[0,2,3,4,9,11,12,29,30,31,38,46,47,48,51,52,53,54,58,59,62,67,68,69,71,76,79,80,81,82,87,88,97,101,102],lenient:[21,23],less:[12,17,54,58],let:5,letter:[6,8,9,10,11,14,18,23,24,30,34,36,48,50,51,53,62,63,64,66,70,71,79,91,93,95,101],level:[2,64],lexicograph:[17,67,72,79],lib64:1,lib:[1,2,49],libc:[2,80],libicu:[1,2],librari:[1,2,17,31,49,98],licens:[0,2,13],ligatur:17,like:[0,1,2,4,5,9,13,14,19,23,31,47,51,58,59,68,76,82,88,93,100,102],limit:[30,66],line:[0,1,2,3,8,9,12,13,19,30,59,63,66,68,74,82,85,86,102],line_break:[8,19,47,59,63,82],linesnempti:85,linguist:[8,9],link:[1,2,9,13],linker:1,linux:[2,5],lipca:23,list:[0,1,2,3,4,5,6,8,9,12,13,16,17,18,19,27,29,30,31,32,33,34,35,36,39,42,44,46,47,49,55,58,59,60,67,72,76,79,80,81,82,83,84,88,89,90,93,95,100,101,102],liter:[12,23,66,76],littl:1,lll:23,llll:23,lllll:23,load:[2,5,30,85,86],local:[0,2,3,7,8,9,12,13,15,17,19,20,21,22,23,26,29,46,47,49,58,59,63,64,67,72,79,80,82,90,91,93,100,102],locale_manag:[6,55,56
,57],locale_sensit:[6,8,10,15,17,19,29,31,47,59,64,67,72,79,80,82,93,100,102],localiz:[0,2,3],locat:[0,2,3,7,8,10,11,19,23,44,47,82],locate_first:58,locate_last:58,log:[67,79],logic:[4,15,17,21,23,27,29,30,34,35,36,37,43,44,46,47,48,49,50,51,54,58,59,60,63,64,65,66,67,68,69,76,79,81,82,83,84,87,88,89,97,102],london:90,longer:[2,36,73,94],longest:[51,54],look:[2,12,14,15,17,30,81,84],lookahead:58,lookup:12,loos:12,lorem:[0,2,3,18,52,76,81,85,86,87,102],los_angel:23,lower:[13,64,93,95],lowercas:[9,95],lukaszdaniel:2,lunar:23,lunch:60,machin:[1,5,39],macro:2,made:2,magrittr:[2,87,88],mai:[1,2,4,5,6,7,8,9,11,12,17,19,20,21,22,23,24,30,33,35,38,39,40,42,43,44,53,54,55,56,57,58,59,62,63,66,68,70,71,76,77,78,81,82,84,85,86,87,93,96,97,98,102],main:30,mainli:95,major:5,make:[1,2,5,8,84,97],makeconf:1,makevar:2,malform:[2,9,55],malici:2,man:[4,7,9,13,45],manag:[1,2,13],mandatori:63,mani:[0,2,6,7,9,12,13,55,57,92,97,98,102],manipul:[5,13],manual:[0,1,2,4,5,12,13,24],map:[0,2,3,5,6,13,40,43,55,65],marek:[0,13],margin:8,mario:17,mark:[2,5,8,9,12,27,30,32,34,35,36,38,40,41,43,44,62,73,80,87,97],marker:[23,44,73],markov:69,markup:30,mask:99,master:[1,12],match:[0,2,3,6,7,8,9,10,12,13,30,31,38,39,46,47,58,59,65,66,76,83,98],matcher:[0,3,4],math:9,mathemat:[9,95],matric:[2,58,59,60,87,88],matrix:[0,3,46,47,58,59,60,81,82,87],max:33,max_count:[2,27],maxim:[33,44,66,73,81,82,102],maximum:1,mean:[9,23,35,36,57,66,85,91,92],meaning:5,mechan:[5,38],medial:101,medium:23,memcheck:2,memori:[2,5,62,74],mention:[19,59,64,82],mere:46,merg:[2,30,46,58,76],messag:[2,12],met:1,meta:84,metacharact:66,method:[53,92,102],mgk25:101,microsystem:2,middl:[8,9,87],might:[9,11,17,19,23,27,30,37,44,87,91],migrat:[9,65],mileston:2,millisecond:[20,22,23,66],mime:33,mimic:2,min:[33,72],mind:[5,58],minim:[2,33,54,68,102],minu:5,minut:[20,21,22,23],mirror:[1,2],misalign:2,mislead:[5,53],miss:[0,2,3,27,29,38,40,42,43,44,46,47,48,50,51,53,58,59,60,61,62,64,66,67,72,75,79,81,85,87,88,89],mmm:23,mmmm:23,mmmmm:23,m
ode:[46,58,60,66,73,74,76,102,103],model:[69,97],modifi:[6,9,20,23,57,86,89],mondai:23,mono:101,monster:93,month:[20,21,22,23,26],more:[0,1,2,4,5,6,8,9,10,12,13,17,18,19,23,24,27,30,31,33,37,43,44,46,47,48,56,57,58,59,60,64,67,72,73,76,79,80,81,82,84,89,90,92,93,97,98,102],moreov:[0,1,2,5,9,19,24,27,38,51,53,54,58,76,83,99,102],morri:[2,11],most:[0,1,2,4,5,9,23,24,26,30,35,36,64,66,97,98,102],mostli:30,move:[2,64],much:[2,10,17,29,73,95,100],multi:[5,9,30],multi_lin:66,multilin:66,multipl:[0,2,3,23,67,68,87,102],multitud:0,must:[6,8,12,76,88],mutual:[87,88],n_max:2,n_min:[2,54,81,82],n_paragraph:[2,69],na_character_:[2,32,54,60,91],na_empti:[2,48,75],na_integer_:91,na_last:[2,67,79],name:[1,2,4,5,9,12,17,18,19,20,21,22,23,26,27,29,30,31,33,37,39,44,46,47,55,57,58,59,60,63,64,65,66,67,72,73,74,76,79,80,81,82,84,85,86,89,90,91,93,95,100,103],narrow:26,nativ:[0,2,3,5,9,13,38,39,43,44,49,62,97],natur:[2,5,7,11,13,17,29,64,100,102],nchar:[2,101],necessari:[1,4,15,18,27,46,58,60,71,76,81,84,89],necessarili:6,need:[2,4,5,12,30,62,87,88,91,98],neg:[12,27,29,81,82,84,87,102],negat:[2,9,27,84,89],neither:[39,43],nel:83,network:97,never:[81,83],new_substr:87,newer:1,newlin:[12,73,83,103],next:83,nfc:[87,97,101],nfd:[64,95,97],nfkc:97,nfkc_casefold:97,nfkd:[95,97],nibh:[85,86,102],nice:2,nie:95,nil:2,nisan:21,nix:2,non:[2,4,5,9,10,12,17,19,20,21,22,23,27,29,45,47,59,64,67,70,71,78,79,82,85,87,99,100,102],noncharacter_code_point:9,nondecreas:[67,79],none:[2,85,102],nonincreas:[67,79],nor:[39,43],norm:97,normal:[0,2,3,5,9,13,17,37,53,62,64,69,70,71,78,87,95,98,100,101,102],normalis:[0,2,64,102],northern:91,norwegian:30,note:[1,2,5,8,9,10,11,12,13,14,17,18,19,20,22,23,30,32,35,36,39,40,41,43,44,46,47,51,53,56,57,58,59,60,63,66,68,76,78,81,82,84,87,91,93,95,97,98,99,101,102],noteworthi:103,noth:[23,103],notion:[10,17,101],now:[1,2],nparagraph:[2,69],npattern:76,nth:12,nul:[44,62],number100:64,number2:64,number:[0,1,2,3,5,6,7,9,12,13,20,22,23,25,27,28,31,33,46,54,63,68,69,71,76,81,8
2,85,86,93,94,101,102],numer:[2,4,5,9,21,23,30,31,64,67,72,79,91,102],numeric_valu:9,object:[0,2,3,14,15,17,19,20,22,23,25,32,38,42,46,47,50,51,53,59,62,63,64,65,66,73,74,77,81,82,87,89,101,103],observ:[2,5,6,43,71,72,91],obtain:[0,2,5,9,30,31,55,85,86,91],occur:[7,8,12,30,44],occurr:[0,2,3,7,18,27,31,44],octal:[12,99],off:1,offset:[90,91],often:[0,10,30,35,62,69,95,97,98],ogonek:[5,36,78,97],old:39,older:1,oldloc:57,oldrel:2,oldtz:92,omit:[1,48,63,83],omit_empti:[2,48,81,83],omit_na:[2,87,88,89],omit_no_match:[2,46,47,52,58,59,60,88],onc:[4,27,74],one:[1,2,4,5,6,8,9,12,18,20,23,26,27,32,33,38,42,44,46,48,53,54,55,58,59,60,62,63,64,68,71,76,85,88,89,90,91,93,95,97,103],ones:[33,64,99],onli:[2,4,5,9,12,30,33,38,39,46,48,51,52,58,59,60,63,66,68,76,80,81,82,83,87,88,89,91,93,98,102],ooo:[12,99],oooo:23,open:[0,2,9,73,74,103],opensus:[1,2],oper:[0,1,2,3,4,5,7,8,9,13,14,15,17,21,29,30,32,42,57,62,66,68,70,71,78,87,88,92,95,100,102],operator_add:[0,3],operator_compar:[0,3],operator_dollar:[0,3],opposit:64,optim:5,option:[1,2,6,15,17,29,30,43,51,52,67,72,79,80,100],opts_brkit:[2,19,47,59,82,93],opts_col:[2,17,18,27,29,46,58,64,67,72,76,79,80,81,84,89,100],opts_fix:[2,18,27,46,58,65,76,81,84,89],opts_regex:[2,18,27,46,58,60,66,76,81,89],oracl:2,order:[0,2,3,5,6,9,13,17,27,30,31,43,44,64,70,72,73,78,79,80,87,97],ordinari:[51,64],org:[1,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,91,92,93,95,96,97,98,100,101],orient:86,origin:[2,80,86],other:[0,2,4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],otherwis:[4,23,27,29,44,45,46,47,49,51,52,54,66,71,81,82,85,90,91,102],our:[1,2,4,5,98],out:[1,2,5,9,46,50,68,69,87,98],output:[2,5,23,42,43,44,47,53,67,68,70,71,73,74,78,79,80,89,97,103],outsid:[12,23],over:[2,5,14,15,16,17,18,
19,20,21,22,23,27,28,30,31,46,47,51,58,59,60,68,71,76,81,82,83,84,87,88,89,93,94,98,102],overal:[5,12],overflow:2,overful:2,overlap:[2,9,46,58,60,65,76],overload:16,overrid:1,overwhelm:1,own:44,pace:13,pacif:23,packag:[1,2,5,9,47,57,68,92],pad:[0,2,3,13],page:[2,4,5,7,13,24,45],pair:9,pairwis:15,paper:[0,2,10],paragraph:[0,2,3,8,9,69,83],paramet:[2,10,83,87,88],parametr:6,parenthes:[12,60,76],pars:[0,2,3,13],part:[1,2,9,38,39,76,87,88],particular:[1,4,5,6,8,9,13,63,87,95],pass:[0,1,2,3,16,18,27,46,55,58,59,60,63,64,65,66,76,81,84,87,88,89],password:71,past:[2,48,51,77],pat1:9,pat2:9,pat:[58,84],patch:2,path:1,patter:2,pattern:[0,2,3,4,7,10,12,13,23,30,66,71,94,98],pdf:2,pdt:23,peculiar:[4,70,71,78],pellentesqu:[85,102],per:[4,6,57,69,102],perform:[0,2,3,4,5,6,7,9,10,11,12,15,17,19,29,47,56,57,59,62,63,64,66,67,74,79,82,95],perl:[9,12],permiss:64,permut:[0,2,3,70,78],persian:26,phonebook:[6,17],php:86,piec:[9,10,19,81,82],pipabl:2,pipe:[2,87,88],pizza:60,pkg:[1,2],pkg_config:[1,2],pkg_config_path:1,pl_fonipa:95,pl_pl:[17,23,26,55,67,72,79,80],place:[9,87,88,89],plai:[5,88],plain:77,plass:102,platform:[1,2,5,6,13,38,83,92,103],pleas:[1,4,5,9,10,17,24,44,60,63,98],plu:[5,9,12],point:[0,2,3,5,8,9,12,13,15,17,19,31,32,33,40,42,44,59,62,64,65,68,71,78,84,85,87,91,93,94,100,102],polish:[5,6,17,30],poor:2,poorli:66,portabl:[0,1,2,5,9,44,72],portion:12,portugues:30,posit:[2,5,8,9,12,35,36,58,59,63,64,81,82,84,87,102],posix:[2,65],posix_alnum:9,posix_blank:9,posix_graph:9,posix_print:9,posix_xdigit:9,posixct:[20,21,22,23,25],posixst:23,possess:12,possibl:[0,1,2,3,4,5,12,31,38,63,65,81,82,84,97,102],potenti:97,power:[0,12,13],pqrst:28,practic:102,pratt:[2,11],pre:[2,95],preced:[9,12],precis:[5,6,66,91],predefin:[9,69],predict:13,prefer:12,prefix:[2,102],prepar:2,preprocessor:1,preserv:[2,98,102],prevent:[2,63],previou:[12,57,92],previous:[2,39,57,92],primari:64,print:[2,5,8,9,20,53,68,87,88,89,101,102],printabl:45,prioriti:87,privat:9,probabl:71,problem:[1,2,97],problemat:44,p
roce:101,process:[2,3,5,7,8,9,10,11,17,29,30,45,47,62,66,68,69,81,92,95,97,98,100,102],produc:[23,44,65],prof:[59,82],program:[5,6,102],proin:[86,102],project:[1,2,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,98,100],pronounc:0,propag:1,proper:36,properli:[1,5,6,10,38,50,53,62],properti:[4,7,12,18,85,98,101],protect:2,protocol:5,provid:[2,5,6,9,10,11,12,13,16,17,31,33,47,49,51,55,60,64,87,90,91,94,95,102],pseudo:[2,13,69,70,71],pt_br:57,punct:9,punctuat:[8,9,10,11,23],purpos:[2,5,8,83],put:[67,79,97,102],python:16,qqq:23,qqqq:23,qqqqq:23,quarter:[23,26],quaternari:64,queri:[0,3,6,56,92],quick:76,quicker:76,quit:[0,5,12,66],quot:[9,12,23,45],quotat:9,quotation_mark:9,r_home:1,r_inst_dir:1,r_usedynamicsymbol:2,ragged:[2,102],rais:[2,33],random:[0,2,3,9,13,69,70,78],randomli:[0,3,69],rang:[0,5,9,12,23,87,88,95],rank:[0,2,3,13,80],ranki:95,rare:[2,4,5],rather:[27,44,66,68,84,89,97,102],raw:[0,3,5,30,31,34,35,36,42,44,90,91],rawoffset:90,rawtochar:[30,44],rbbi:63,rbind:91,rbuildignor:1,rchk:2,rcpp:[0,2],read:[0,2,3,5,13,38,41],readabl:90,readbin:30,readlin:[30,73,85,86],real:23,realli:[5,55],rearrang:67,reason:[2,4,5,43,44],recal:9,receiv:72,recent:1,recogn:[6,45,66,99],recommend:[97,102],recycl:[2,4,15,18,27,46,58,60,71,76,81,84,88,89],redund:71,refer:[0,1,2,18,24,27,46,58,60,76,81,84,89],referenc:6,reflect:[6,33],reformat:102,regard:[2,29,67],regardless:5,regex:[0,2,3,4,7,9,18,27,46,58,76,81,84,89],regexmatch:2,regexp:[9,12,66],region:[6,91],regular:[0,3,4,5,7,9,13,66,83,98],reilli:12,rel:[1,23,80],relat:[13,15,17,23],relationship:64,releas:[0,1,2,85,86],relev:1,reli:[1,2,5,84,98],reliabl:64,remaind:[81,82],rememb:4,remov:[0,2,3,5,9,17,30,37,43,63,64,65,66,67,76,79,81,83,95,97,98,100],renam:2,rep:70,replac:[0,2,3,7,13,20,23,24,40,43,44,71,72,81,89,94,98,102],repo:1,report:[1,2,9,12,19,66,83,97,101],repres:[5,9,17,23,25,30,32,33,36,37,46,58,60,66,83,85,86,91],represent:[2,5,21,33,80,90,92],request:[5,6,24,56],requir:[1,2,11,12,23,63],rese
rv:[9,23],resolv:1,resourc:[6,56],respect:[2,4,9,12,18,23,27,46,47,58,59,72,76,81,82,84,87,88,89,94],rest:93,restor:[57,92],restrict:95,result:[2,4,5,6,9,11,12,13,14,15,17,18,19,23,27,28,29,35,36,37,41,43,46,47,49,51,52,54,55,58,60,64,65,69,70,71,72,76,78,79,80,81,82,83,84,88,89,93,99],retri:12,reus:4,revers:[0,3,13,33,68,70],revert:2,rexamin:76,rf_error:2,rfc3629:13,rfc5198:97,rfc:[13,23,97],rid:[2,75],right:[0,3,9,46,58,76],robust:73,role:[5,88],romanian:30,roughli:[31,42,77,89,101],round:[2,60,76],routin:[2,5],row:[23,46,47,54,58,59,60,81,82],rpm:1,rule:[2,4,19,47,59,63,64,83,88,91,97],run:[2,30,46,57,62,76,84,87,92],runif:72,russian:30,sake:23,same:[2,5,6,9,13,17,29,33,38,39,50,53,54,55,57,62,64,72,80,81,91,97,100,101],sampl:[71,79],saniti:2,sappli:[69,90],sausag:52,save:[90,91],scelerisqu:[85,86,102],scenario:[46,58,60,88],scharf:93,schedul:2,scheme:[5,9,33],scp:1,screen:68,script:[1,2,9,68,71,95,102],search:[0,1,2,3,4,5,6,9,11,12,13,18,19,27,29,46,47,58,59,60,63,64,66,71,76,81,82,84,85,89,98,101],search_charclass:[7,9,98],search_col:[7,10,64],search_count:[7,18,19],search_detect:[7,27,84],search_extract:[7,46,47,60],search_fix:[7,11,65],search_loc:[7,58,59],search_regex:[7,12,66],search_replac:[7,76,98],search_split:[7,81,82,83],search_subset:[7,89],second:[2,17,20,21,22,23,25,58,59,60,91],secondari:64,section:[6,9,12,66],sed:[1,85,86,102],see:[0,1,2,16,68,78],seek:13,seem:10,seen:[2,38],segfault:2,select:[0,3,5,6,22,31,33,69,102],selector:26,semant:5,sens:5,sensit:[0,3,7,13,23,57,65,66,93],sentenc:[8,19,59,63,69,82,93],sep:[2,14,23,48,51,52,68,69,77,102,103],separ:[8,9,23,47,48,51,52,55,58,63,73,81,83,84,85,86,95,103],septemb:23,sequenc:[0,1,2,3,5,11,12,23,30,32,34,36,40,42,43,44,53,58,66,83,95,97,102],seri:[9,95],serv:[44,83],server:[1,2],servic:[2,5,6,10,56,64,91,95],session:1,set:[0,1,2,3,4,5,6,9,11,12,17,18,19,20,21,22,23,27,29,32,42,43,44,46,47,51,53,58,59,60,67,69,71,72,76,79,80,81,82,83,84,89,93,100],setdatadirectori:2,setup:1,sever:[6,30],shall:2,shap
e:9,shift_ji:30,ship:[1,2],shorter:[15,18,27,46,58,60,76,81,84,89],should:[1,2,5,6,21,23,29,30,38,39,44,48,49,54,58,63,65,67,68,69,75,76,79,81,83,89,98,101,102],show:30,shown:[5,9,12],shuffl:[0,3],side:[0,3,68,102],sign:[2,5,9,20,25],signific:[2,6,23],significantli:[29,100],silent:[2,4,5,17,43,51,52,87],similar:[2,5,6,9,12,16,43,54,55,91],simpl:[2,5,38,65,69,102],simplest:88,simpli:[1,2],simplifi:[2,30,37,46,47,69,81,82,102],simplify2arrai:54,sinc:[0,9,12,25,46,76,91],singl:[2,5,8,9,16,19,20,21,22,23,26,27,29,30,31,32,33,37,39,40,43,44,46,47,48,49,51,52,54,55,57,58,59,60,63,64,65,67,68,69,71,73,76,77,79,80,81,82,83,84,87,88,89,90,91,92,93,94,95,98,102],singleton:27,sit:[18,52,69,76,81,85,86,87,102],site:[1,2,13,91],situat:39,six:12,size:[33,44,66,73],sk_sk:[17,46,58,67,72,79,80,90],skip:[46,58,76],skip_:63,skip_line_hard:63,skip_line_soft:63,skip_sentence_sep:[63,82],skip_sentence_term:63,skip_word_ideo:63,skip_word_kana:63,skip_word_lett:[63,82],skip_word_non:[19,59,63,82],skip_word_numb:[63,82],slash:9,slightli:[84,86],slovak:17,slow:76,slower:[10,14,29,100],small:[5,71,86,93,95],smaller:88,smith:[59,82],snprintf:2,soft:[9,63,101],soft_dot:9,softwar:102,solari:[1,2,39],sole:[2,5],solut:1,solv:2,some:[1,2,4,5,9,11,12,13,23,24,30,33,37,44,48,55,56,57,58,63,66,86,87,90,99],somehow:5,someth:[9,76],sometim:[4,35,53,83],somewhat:[12,67,79],sort:[0,2,3,5,6,13,37,64,67,88],sourc:[0,1,2,69],sourceforg:86,southern:91,space:[2,5,8,9,12,18,23,46,58,66,76,85,86,98,101,102],space_separ:12,spaghetti:60,spam:[19,52,59,82],sparc:1,speak:5,special:[5,9,45,63,66],specif:[2,6,8,9,10,11,13,17,20,23,31,56,84,91,97],specifi:[2,5,6,9,12,20,21,22,23,24,37,44,63,71,76,95,97,98,102],spectrum:5,speed:[2,5,66],spell:2,split:[0,2,3,7,12,13,73,74,102],spontan:2,sprintf:[0,2,3],squar:[9,102],src:[1,2],sse2:2,sss:23,ssss:23,ssz:23,stabl:[67,79],stable_sort:[67,79],stack:[2,66],stack_limit:[2,66],stage:2,stand:[6,9,22,23,26],standalon:26,standard:[0,1,2,5,6,9,12,33,59,62,82,83,97,99,101],start:[0,
2,3,7,8,9,27,46,58,59,66,68,69,76,87,88,98,102],start_lipsum:69,stat:[85,86],state:[2,9,20,68,90,102],statist:[0,3,5,13,30,31],statu:[2,19,47,59],stdin:[5,38],step:95,stick:98,still:[1,6],sting:27,stl:[67,79],stop:[2,27,66],storag:[5,66],store:[5,62],str2:77,str:[2,11,18,19,23,27,28,29,30,31,34,35,36,38,40,41,42,43,44,45,46,47,48,50,53,58,59,60,62,67,68,70,72,76,77,78,79,80,81,82,83,84,85,86,87,88,89,93,94,95,97,98,99,100,101,102,103],str_split_fix:2,strchr:2,strcmp:[17,80],stream:[0,3,40,43],strength:[17,29,46,58,64,84,100],strftime:[23,24],stri:[2,14,15,16,28],stri_:[2,4,7,9,10,12,65,84],stri_brkit:2,stri_c:[2,51],stri_c_list:52,stri_cmp:[2,13,17,64],stri_cmp_eq:[2,17,93],stri_cmp_equiv:[2,15,17],stri_cmp_g:[2,17],stri_cmp_gt:[2,17],stri_cmp_l:[2,15,17],stri_cmp_lt:[2,17],stri_cmp_neq:[2,17],stri_cmp_nequiv:[2,17],stri_col:64,stri_compar:[0,3,6,8,10,15,19,29,31,47,59,64,67,72,79,80,82,93,100,102],stri_conv:44,stri_count:[0,2,3,7,19],stri_count_:7,stri_count_boundari:[0,2,3,6,7,8,10,13,15,17,18,29,31,47,53,59,63,64,67,72,79,80,82,83,93,100,102],stri_count_charclass:18,stri_count_col:18,stri_count_fix:[2,18,65],stri_count_regex:[18,66],stri_count_word:[2,19,47,59],stri_datetime_add:[0,2,3,21,22,23,24,25,26,90,91,92],stri_datetime_cr:[0,2,3,20,22,23,24,25,26,90,91,92],stri_datetime_field:[0,2,3,20,21,23,24,25,26,90,91,92],stri_datetime_format:[0,2,3,13,20,21,22,24,25,26,90,91,92],stri_datetime_fstr:[0,2,3,20,21,22,23,25,26,90,91,92],stri_datetime_now:[0,2,3,20,21,22,23,24,26,90,91,92],stri_datetime_pars:[2,23,24],stri_datetime_symbol:[0,2,3,20,21,22,23,24,25,90,91,92],stri_detect:[0,2,3,7,84,89],stri_detect_:[2,7],stri_detect_charclass:27,stri_detect_col:[27,64],stri_detect_fix:[27,65],stri_detect_regex:[2,27,66,84],stri_dup:[0,2,3,13,14,48,51,52],stri_dupl:[0,2,3,6,8,10,13,15,17,19,31,47,59,64,67,72,79,80,82,93,100,102],stri_duplicated_ani:[2,29],stri_enc_detect2:[0,2,3,5,6,8,10,15,17,19,29,30,34,35,36,47,59,64,67,72,79,80,82,93,100,102],stri_enc_detect:[0,2,3,5,31,
34,35,36,74],stri_enc_fromutf32:[0,3,5,40,41,42,43,44,46,101],stri_enc_get:[5,38,39,41,43,44],stri_enc_info:[0,3,5,37,38,39,49],stri_enc_isascii:[0,2,3,5,30,31,35,36],stri_enc_isnf:2,stri_enc_isutf16:[0,3],stri_enc_isutf16b:[5,30,31,34,35,36],stri_enc_isutf16l:35,stri_enc_isutf32b:35,stri_enc_isutf32l:35,stri_enc_isutf8:[0,2,3,5,30,31,34,35],stri_enc_list:[0,3,5,33,38,39,44],stri_enc_mark:[0,2,3,5,33,37,39,40,41,43,44],stri_enc_nf:2,stri_enc_set:[0,2,3,5,33,37,38],stri_enc_toascii:[0,3,5,32,41,42,43,44],stri_enc_ton:[0,2,3,5,32,40,42,43,44],stri_enc_toutf32:[0,3,5,32,40,41,43,44],stri_enc_toutf8:[0,2,3,5,32,40,41,42,44,53,77],stri_encod:[0,2,3,5,30,32,40,41,42,43,73,74],stri_endswith:[2,27,84],stri_endswith_:[2,7],stri_endswith_charclass:84,stri_endswith_col:84,stri_endswith_fix:84,stri_escape_unicod:[0,3,13,62,99],stri_extract:[0,2,3,7,58,60],stri_extract_:[2,7,46,47],stri_extract_al:[2,7,46,47,54,60,88],stri_extract_all_:[2,46,47],stri_extract_all_boundari:[6,7,8,10,15,17,19,29,31,46,47,59,60,63,64,67,72,79,80,82,83,93,100,102],stri_extract_all_charclass:[2,46],stri_extract_all_col:46,stri_extract_all_fix:[2,46,65],stri_extract_all_regex:[2,46,52,60],stri_extract_all_word:[2,8,12,19,47,52,59],stri_extract_boundari:[0,3],stri_extract_first:[46,87],stri_extract_first_:[46,47],stri_extract_first_boundari:47,stri_extract_first_charclass:46,stri_extract_first_col:46,stri_extract_first_fix:46,stri_extract_first_regex:46,stri_extract_first_word:[2,47],stri_extract_last:[46,87],stri_extract_last_:[46,47],stri_extract_last_boundari:47,stri_extract_last_charclass:46,stri_extract_last_col:46,stri_extract_last_fix:46,stri_extract_last_regex:46,stri_extract_last_word:[2,47],stri_extract_word:2,stri_flatten:[0,2,3,13,14,28,30,51,52,69],stri_info:[0,2,3,39],stri_install_check:2,stri_install_icudt:2,stri_isempti:[0,3,53,62,101],stri_join:[0,2,3,4,13,14,28,48,52],stri_join_list:[0,2,3,14,28,48,51],stri_length:[0,2,3,13,19,50,62,94,101],stri_list2matrix:[0,2,3,46,47,61,75,77,81,82]
,stri_loc:[0,2,3,7],stri_locale_get:57,stri_locale_info:[0,3,6,49,56,57],stri_locale_list:[0,3,6,55,57],stri_locale_set:[0,3,6,55,56],stri_locate_:[7,58,59],stri_locate_al:[7,58,59,87,88],stri_locate_all_:[2,58,59],stri_locate_all_boundari:[2,6,7,8,10,15,17,19,29,31,47,58,59,63,64,67,72,79,80,82,83,87,88,93,100,102],stri_locate_all_charclass:[2,58],stri_locate_all_col:58,stri_locate_all_fix:[2,58,65],stri_locate_all_regex:[44,58,88],stri_locate_all_word:[2,19,59],stri_locate_boundari:[0,2,3],stri_locate_first:[58,87,88],stri_locate_first_:[58,59],stri_locate_first_boundari:[2,59],stri_locate_first_charclass:58,stri_locate_first_col:58,stri_locate_first_fix:58,stri_locate_first_regex:[58,87],stri_locate_first_word:[2,59],stri_locate_last:[58,87,88],stri_locate_last_:[58,59],stri_locate_last_boundari:[2,59],stri_locate_last_charclass:58,stri_locate_last_col:58,stri_locate_last_fix:58,stri_locate_last_regex:[58,87],stri_locate_last_word:[2,59],stri_locate_regex:2,stri_locate_word:2,stri_match:[0,2,3,7,12,46],stri_match_:[2,60],stri_match_al:[7,46,47,60],stri_match_all_:[2,60],stri_match_all_regex:60,stri_match_first:60,stri_match_first_regex:60,stri_match_last:60,stri_match_last_regex:60,stri_na2empti:[0,2,3,54,75,77],stri_numbyt:[0,3,19,50,53,101],stri_omit_empti:[2,75],stri_omit_empty_na:[2,75],stri_omit_na:[2,75],stri_opts_brkit:[0,2,3,7,8,19,47,59,82,83,93,102],stri_opts_col:[0,2,3,6,7,8,10,13,15,17,18,19,27,29,31,46,47,58,59,67,72,76,79,80,81,82,84,89,93,100,102],stri_opts_fix:[0,2,3,7,11,18,27,46,58,76,81,84,89],stri_opts_regex:[0,2,3,7,12,18,27,46,58,60,76,81,89],stri_ord:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,72,79,80,82,93,100,102],stri_pad:[0,2,3,13,102],stri_pad_:[2,68],stri_pad_both:[2,68],stri_pad_left:[2,68],stri_pad_right:[2,68],stri_past:[2,51,58,70,71,77,84,102],stri_paste_list:52,stri_prepare_arg_posixct:2,stri_rand_lipsum:[0,2,3,13,70,71],stri_rand_shuffl:[0,2,3,13,69,71,78],stri_rand_str:[0,2,3,9,13,69,70],stri_rank:[0,2,3,6,8,10,13,15,17,19,29,31
,47,59,64,67,79,80,82,93,100,102],stri_read_bin:2,stri_read_lin:[0,2,3,13,74,85,103],stri_read_raw:[0,2,3,13,73,103],stri_remove_empti:[0,2,3,54,61,77],stri_remove_empty_na:[2,75],stri_remove_na:[2,75],stri_replac:[0,3,7,98],stri_replace_:[7,76],stri_replace_al:[2,7,76,98],stri_replace_all_:[2,76],stri_replace_all_charclass:[2,76],stri_replace_all_col:76,stri_replace_all_fix:[2,76],stri_replace_all_regex:76,stri_replace_first:[76,87],stri_replace_first_charclass:76,stri_replace_first_col:76,stri_replace_first_fix:76,stri_replace_first_regex:76,stri_replace_last:[76,87],stri_replace_last_charclass:76,stri_replace_last_col:76,stri_replace_last_fix:76,stri_replace_last_regex:76,stri_replace_na:[0,2,3,54,61,75],stri_revers:[0,3,13,70],stri_sort:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,72,80,82,93,100,102],stri_sort_kei:[0,2,3,6,8,10,15,17,19,29,31,47,59,64,67,72,79,82,93,100,102],stri_split:[0,2,3,7,54,82,83],stri_split_:[2,7],stri_split_boundari:[0,2,3,6,7,8,10,15,17,19,29,31,47,59,63,64,67,72,79,80,81,83,93,100,102],stri_split_charclass:[2,81],stri_split_col:[2,81],stri_split_fix:[2,55,81],stri_split_lin:[0,3,7,8,13,19,47,59,63,81,82,93,102],stri_split_lines1:[73,74,83],stri_split_regex:[2,81],stri_startsendswith:[0,3],stri_startswith:[2,7,27,84],stri_startswith_:[2,7],stri_startswith_charclass:84,stri_startswith_col:84,stri_startswith_fix:84,stri_stats_gener:[0,3,13,86],stri_stats_latex:[0,3,13,85],stri_sub:[0,2,3,13,58,59,88],stri_sub_al:[0,2,3,58,59,87],stri_sub_all_replac:88,stri_sub_replac:[2,87],stri_sub_replace_al:[2,88],stri_subset:[0,2,3,7,27],stri_subset_:[2,7],stri_subset_charclass:89,stri_subset_col:89,stri_subset_fix:89,stri_subset_regex:89,stri_timezone_get:[2,20,21,22,23,24,25,26,90,91,92],stri_timezone_info:[0,2,3,20,21,22,23,24,25,26,91,92],stri_timezone_list:[0,2,3,20,21,22,23,24,25,26,90,92],stri_timezone_set:[0,2,3],stri_trans_casefold:2,stri_trans_casemap:[0,3],stri_trans_char:[0,2,3,13,93,95,96,97],stri_trans_gener:[0,2,3,13,93,94,96,97],stri_
trans_isnf:[2,97],stri_trans_isnfc:97,stri_trans_isnfd:97,stri_trans_isnfkc:97,stri_trans_isnfkc_casefold:97,stri_trans_isnfkd:97,stri_trans_list:[0,2,3,93,94,95,97],stri_trans_nf:[0,2,3],stri_trans_nfc:[5,13,53,87,93,94,95,96,97,101,102],stri_trans_nfd:[78,95,97],stri_trans_nfkc:97,stri_trans_nfkc_casefold:97,stri_trans_nfkd:[17,19,29,53,68,97,100,101],stri_trans_to:2,stri_trans_tolow:[6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,72,79,80,82,83,93,94,95,96,97,100,102],stri_trans_totitl:[2,8,93],stri_trans_toupp:[93,95],stri_trim:[0,3,7,13,76],stri_trim_both:[7,9,76,98],stri_trim_left:[68,98],stri_trim_right:98,stri_unescape_unicod:[0,3,45],stri_uniqu:[0,2,3,6,8,10,13,15,17,19,29,31,47,59,64,67,72,79,80,82,93,102],stri_width:[0,2,3,13,50,53,62,68,102],stri_wrap:[0,2,3,6,7,8,10,13,15,17,19,29,31,47,59,63,64,67,68,69,72,79,80,82,83,93,100],stri_write_lin:[0,2,3,13,73,74],stricontainerutf16:2,stricontainerutf8:2,strictest:64,striexcept:2,string8:2,string:[2,3,4,5,6,9,11,12,16,18,19,20,21,22,23,26,27,29,30,31,32,33,34,35,36,39,40,45,46,47,49,51,53,54,55,57,58,59,60,62,63,64,65,66,67,69,72,73,76,77,79,80,85,86,87,88,89,90,91,92,94,95,97,100,101,102],stringi:[7,13,17,18,19,25,27,32,34,35,36,37,38,44,46,47,51,55,56,58,59,60,63,64,65,66,67,68,71,72,76,79,80,81,82,83,84,85,86,87,89,93,95,97,98,100,101,102],stringi_1:1,stringi_cflag:[1,2],stringi_cppflag:[1,2],stringi_cxxflag:[1,2],stringi_disable_cxx11:[1,2],stringi_disable_icu_bundl:[1,2],stringi_disable_pkg_config:[1,2],stringi_general_top:[4,5,6,7,8,9,10,11,12,13],stringi_ldflag:[1,2],stringi_lib:[1,2],stringr:[0,2],stringsearch:[7,10],strncpy:2,strongli:[1,9],strptime:[0,2,3],strrringi:[18,27],strstr:2,strsxp:2,strwrap:[2,102],stubdata:2,student:2,studio:2,stuff:[85,86],style:[0,3,9,23,30],sub:[12,60,89],sub_index:2,submiss:2,subsequ:102,subset:[1,2,4,5,7,9,27,33],substitut:[2,5,40,44,73,81,87,88,89,102,103],substr:[0,2,3,12,13,46,59,60,64,76,81],success:1,successfulli:1,suffici:2,suggest:[0,1,2,6,102,103],suit:[29,98,100],
suitabl:[1,2,102],summar:[9,12],sun:2,sundai:22,superset:[5,39],supplementari:[18,27,46,58,60,76,81,84,89],suppli:[2,12,30,31,76],support:[0,2,5,6,9,23,24,37,39,44,46,49,60,62,81,90,97],suppos:2,suppress:2,sure:[1,35],surrog:9,surround:93,suscipit:[85,86,102],swedish:30,sxpinfo:2,syllabl:9,symbol:[2,9,23],synonym:28,syntax:[9,12,16,23,63],sys:2,system:[1,2,5,6,8,9,38,39,49],tab:[9,12,83,102],tabl:30,tabul:12,take:[10,17,65,68,90,102],taken:[8,30],tar:1,target:[2,44],tartanu:[0,13],task:[2,7,12,13,95,96],tato:95,team:86,technic:[5,8,12,44,83,97],techniqu:30,technolog:2,tellu:[85,102],temporari:14,term:[51,91],termin:[12,27,63,66],terminal_punctu:9,tertiari:64,test1:77,test2:19,test:[2,6,9,15,17,19,27,29,30,39,59,77,82,84,100],text:[0,2,3,5,7,9,12,13,23,30,31,63,68,69,81,85,86,87,93,97,101],text_boundari:[7,8,19,47,59,63,82,83,93,102],textbf:86,textit:86,textual:9,tf08:5,tgca:94,th_th_tradit:26,than:[2,4,5,8,9,10,12,14,17,23,29,38,40,44,51,52,54,58,62,64,67,70,71,88,100,102],thank:[0,2],thei:[2,5,6,9,12,13,15,17,23,32,43,44,46,58,59,60,63,65,67,76,79,84,89,95],them:[5,6,17,30,33,96],themselv:[66,81],theoret:9,therefor:[5,9,17,83],therein:13,thereof:44,thi:[0,1,2,4,5,6,7,8,9,17,18,19,22,23,27,30,31,32,33,34,36,37,38,40,41,42,43,44,46,50,51,53,54,55,58,59,60,61,62,63,64,65,66,67,68,70,71,72,73,76,77,78,79,80,82,83,84,85,86,91,95,97,100,102,103],think:8,third:[8,60,64],those:[5,6,10],though:[2,12],thought:5,three:[12,23,30,31,91,93],through:9,throughout:91,thu:[4,5,59,81,97,103],tie:9,tied:72,time:[0,2,3,5,9,11,12,13,14,24,28,29,66,81,89,94],time_limit:[2,66],timezon:[20,23,90,91,92],titl:[13,93,95],to_raw:44,todo:2,togeth:[0,1,3,6,49,95],token:[81,82],tokens_onli:[2,81,82],toler:1,too:2,took:4,tool:[2,12,13,97],top:64,topic:[12,13],total:[12,31,68,85,98,102],tr11:101,tr13:83,tr15:97,tr18:[12,83],tr29:66,tr44:9,tr_tr:93,tracker:0,tradit:[30,66],trail:62,transform:[0,2,3,13,94,97],transit:12,translat:[0,3,5,13,33],transliter:[0,2,3,13],transpos:54,transposit:54,treat:[12,
13,23,48,51,64,66,75],treatment:[67,79],tri:[2,5,8,12,31,37,39],trick:1,trim:[0,3,13,84],trivial:2,truncat:[23,69],tue:23,tuesdai:23,tune:[6,10,11,12,17,18,27,46,58,63,64,65,66,67,72,76,79,80,81,84,89],turkish:30,turn:64,tutori:12,tweak:[1,2,11],two:[0,2,3,5,6,9,12,15,17,23,53,58,59,72,83,87,88,91,93,94,97],txt:[9,30,97],type:[1,2,5,8,9,19,44,53,59,63,74,81,82,87,88,93,103],typic:[5,14,15,84,91,97],tzone:22,u0000:9,u0007:12,u0009:12,u000a:12,u000c:12,u000d:12,u0010ffff:[9,12],u001a:44,u001b:12,u0032:99,u00a0abov:[19,59,82],u00a9:19,u00df:[19,29,93,95,100],u00e1rio:17,u00e4rtn:17,u00fd:[17,46,58],u0104123:78,u0104:[34,36,50,53,62,93,95],u0105:[9,17,29,34,36,45,50,53,62,78,93,97,99,100,101],u0119:19,u0153:19,u0222:36,u03c0:19,u0627:[58,84],u0633:[58,84],u0635:[58,84],u0639:[58,84],u0644:[58,84],u0645xyz:[58,84],u0647:[58,84],u0648:[58,84],u0649:[58,84],u064a:[58,84],u105:17,u1234:36,u200c:12,u200d:12,u2190:19,u2192:19,u2193:19,u2620:95,u7fffffff:62,u_charset_is_utf8:[2,39,49],u_ea_fullwidth:101,u_ea_wid:101,u_hst_trailing_jamo:101,u_hst_vowel_jamo:101,u_init:2,u_missing_resource_error:2,u_toupp:65,uax:101,ubbfc:68,ubc1f:101,ubrk:63,ubrk_8h:63,ubrk_word_non:[19,47,59],ubsan:2,ubuntu:[1,2],uc74c:68,uc815:68,ucd:13,uchar32:33,uchar:33,uchar_east_asian_width:101,uchar_hangul_syllable_typ:101,ucs:101,ud6c8:68,ufb00:17,ufdfa:[58,84,97],ufdfaxyz:[58,84],ufffd:[43,44],uhhhh:12,uhhhhhhhh:12,uint32_t:2,umlaut:36,unambigu:83,unassign:9,unavail:[33,56,60],unbound:12,unchang:[43,76,87,88],under:[0,2,5,13],underli:[18,27,46,58,60,76,80,81,84,89],underscor:55,understand:[5,55,99],undesir:39,unfortun:5,unicod:[0,2,3,5,7,8,11,12,13,17,19,26,32,33,42,43,49,53,62,63,64,66,68,70,71,73,78,81,83,85,87,91,92,93,94,95,98,99,100,101,102],unicode_equival:97,unicodeset:[2,95],unicodestr:2,unidata:9,uninspect:27,union:9,uniqu:[0,2,3,6,8,29,37,94],unit:[2,5,8,9,20,93],unitialis:2,univers:[2,5,13,91,98],unix:[2,5,9,66],unix_lin:66,unknown:[2,5,6,30,33,38],unless:[5,9,27,39,51,52,92],unlik:[23,29,3
8,42,58,100],unnecessari:98,unprotect:2,unrecogn:66,unsupport:55,until:12,unzip:1,updat:2,upgrad:2,upon:1,upper:[9,13,64,93,95],uppercas:[9,95],uppercase_first:64,ups:[2,5],uregex_8h:66,uregexpflag:66,usag:[1,2,9],use:[1,2,4,9,10,12,38,42,43,44,48,62,66,81,84,86,89,91,95,97,101],use_length:[68,102],use_width:2,usearch:2,used:[1,2,4,5,6,9,13,17,18,19,23,24,27,30,32,33,38,39,40,43,44,45,46,47,48,49,51,52,53,55,57,58,59,60,62,63,64,65,68,69,73,76,77,81,83,84,87,89,90,91,92,93,94,96,98,102],usedynlib:2,useful:[2,5,7,9,19,54,59,80,82,95],user:[1,2,5,6,8,9,10,12,17,20,23,26,29,30,39,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],userguid:[5,6,8,9,10,12,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,91,93,95,96,97,100],uses:[2,6,8,9,26,30,31,38,65,66,67,79,90,97],usesdaylighttim:90,using:[2,5,6,9,10,15,23,24,30,31,66,80,92,97,103],uslax:23,usr:1,usual:[11,15,32,45,51,53,67,79,88,89,97,100],utc:[25,91],utf8:[5,37,49],utf8toint:42,utf:[0,2,3,13,17,30,31,33,38,39,40,41,44,49,51,53,62,73,89,97,99,103],utf_8:5,utf_bom:5,util:[6,12,54,61,75,77,92,102],utr22:33,utr:83,uuuu:23,uword:66,uxxxx:[45,99],uxxxxxxxx:[45,99],valgrind:2,valid:[2,5,6,17,31,34,35,36,37,43,99],valu:[0,2,3,5,6,9,12],vari:91,variabl:[1,2,23,64],variant:[6,55,76,87,88],varieti:95,variou:[5,68,102],vec:32,vector:[0,2,3,5,7,13,15,16,17,18,19,20,21,22,23,24,27,28,29,30,31,32,34,35,36,37,38,40,41,42,43,44,45,46,47,48,50,52,53,54,56,58,59,60,61,62,67,68,69,70,71,72,73,74,76,78,79,80,81,82,83,84,88,89,91,93,94,95,96,97,98,99,100,101,102,103],vectorise_al:76,vectorize_al:[2,76],vel:[85,102],veri:[0,1,2,5,9,11,12,19,39,59,69,82,102],verifi:6,versa:23,version:[1,2,20,32,44,49,75,79,87,88,89,99,100],vertic:83,via:[1,2,11,12,30,38,51,65],vice:23,video:0,vietnames:9,vignett:2,violat:2,vowel:101,vvv:23,vvvv:23,w3c:97,wai:[2,5,10,11,12,16,23,34,35,36,44,50,64,73,77,81,95,102,103],want:[2,6,42,43],warn:[2,4,9,12,18,24,27,32,39,40,42,44,53,63,64,65,66,84,94,99],warnfix:2,warsaw:[2,92],wcwidth:101,weakli:79,web:97,wed:23,week:[20,
23],weekdai:26,weekofmonth:22,weekofyear:22,weight:64,well:[2,9,13,36,45,49,64,87,101],were:[2,5,60,95],werner:10,western:5,wget:1,what:[0,4,5,8,9,11,17,39,43],whatev:12,when:[2,4,5,6,8,12,17,23,43,53,64,66,68,80,83,90,91,102],whenev:[4,5,65],where:[2,5,17,23,24,32,39,42,43,51,58,63,67,76,79,83,84,85,86,89,91,98,102],wherea:23,wherev:[77,87,88],whether:[2,6,17,23,27,29,31,34,35,36,38,44,46,49,50,58,64,66,81,83,84,87,88,89,90,97,100],which:[1,2,5,6,8,9,10,13,19,29,30,40,44,51,62,64,67,68,73,79,80,81,82,91,97,102],white:[2,9,12,13,18,46,58,66,76,85,86,98,102],white_spac:[9,18,76,81,85],whitespace_onli:[2,102],who:6,whole:[8,60,65],wickham:0,wide:[0,5,26,97],width:[0,2,3,9,13,23,26,53,68,102],wieczori:95,wiki:97,wikipedia:97,win:2,winbuild:2,window:[2,5,30,33,36,62,90,99,103],windtfmt:2,winnmfmt:2,wise:[2,7,13],wish:[1,12,48,76,81,84],within:[1,2,4,6,8,12,18,23,27,30,46,58,60,66,87,88,102],without:[0,3,6,23,66],word:[0,2,3,8,9,12,19,47,59,63,66,69,76,82,86,89,93],word_boundari:66,work:[1,2,5,30,31,41,65,87,97,99],world:[5,97],worst:11,worth:93,would:[8,62,66,98],wparenthes:2,wraca:95,wrap:[0,2,3,8,13,68,88],wrapper:[60,98],write:[0,3,8,13],writelin:103,written:[5,30,66],wspace:[84,98],www:[5,6,9,12,83,97,101],x1a:40,xaaaax:[46,58],xhh:12,xml:30,xnox:2,xtfrm:72,xxx:[23,48,99],xxxx:23,xxxxx:23,xyx:60,xyz:51,year:[5,20,21,22,23,90,91],yet:[2,13,97,98],yield:[2,23,46,67],you:[0,1,2,4,5,6,9,10,11,12,17,30,31,38,39,42,43,48,51,52,55,57,58,59,62,66,70,76,81,84,85,97,98,102],your:[1,4,5,6,9,38,39,62,84,98],yutannihil:2,yyyi:23,yyyyi:23,zc1:27,zero:[0,2,3,5,9,12,23,58,81,101,102],zip:[1,2],zipf:69,zone:[0,2,3,13,20,21,22,23],zwnbsp:9,zwsp:9,zxy:78,zzz:23,zzzz:23,zzzzz:23},titles:["stringi: THE String Processing Package for R","Installing stringi","What Is New in stringi","R Package stringi Reference","about_arguments: Passing Arguments to Functions in stringi","about_encoding: Character Encodings and stringi","about_locale: Locales and stringi","about_search: String 
Searching","about_search_boundaries: Text Boundary Analysis in stringi","about_search_charclass: Character Classes in stringi","about_search_coll: Locale-Sensitive Text Searching in stringi","about_search_fixed: Locale-Insensitive Fixed Pattern Matching in stringi","about_search_regex: Regular Expressions in stringi","about_stringi: THE String Processing Package","operator_add: Concatenate Two Character Vectors","operator_compare: Compare Strings with or without Collation","operator_dollar: C-Style Formatting with sprintf as a Binary Operator","stri_compare: Compare Strings with or without Collation","stri_count: Count the Number of Pattern Matches","stri_count_boundaries: Count the Number of Text Boundaries","stri_datetime_add: Date and Time Arithmetic","stri_datetime_create: Create a Date-Time Object","stri_datetime_fields: Get Values for Date and Time Fields","stri_datetime_format: Date and Time Formatting and Parsing","stri_datetime_fstr: Convert strptime-Style Format Strings","stri_datetime_now: Get Current Date and Time","stri_datetime_symbols: List Localizable Date-Time Formatting Data","stri_detect: Detect a Pattern Match","stri_dup: Duplicate Strings","stri_duplicated: Determine Duplicated Elements","stri_enc_detect: Detect Character Set and Language","stri_enc_detect2: [DEPRECATED] Detect Locale-Sensitive Character Encoding","stri_enc_fromutf32: Convert From UTF-32","stri_enc_info: Query a Character Encoding","stri_enc_isascii: Check If a Data Stream Is Possibly in ASCII","stri_enc_isutf16: Check If a Data Stream Is Possibly in UTF-16 or UTF-32","stri_enc_isutf8: Check If a Data Stream Is Possibly in UTF-8","stri_enc_list: List Known Character Encodings","stri_enc_mark: Get Declared Encodings of Each String","stri_enc_set: Set or Get Default Character Encoding in stringi","stri_enc_toascii: Convert To ASCII","stri_enc_tonative: Convert Strings To Native Encoding","stri_enc_toutf32: Convert Strings To UTF-32","stri_enc_toutf8: Convert Strings To 
UTF-8","stri_encode: Convert Strings Between Given Encodings","stri_escape_unicode: Escape Unicode Code Points","stri_extract: Extract Occurrences of a Pattern","stri_extract_boundaries: Extract Data Between Text Boundaries","stri_flatten: Flatten a String","stri_info: Query Default Settings for stringi","stri_isempty: Determine if a String is of Length Zero","stri_join: Concatenate Character Vectors","stri_join_list: Concatenate Strings in a List","stri_length: Count the Number of Code Points","stri_list2matrix: Convert a List to a Character Matrix","stri_locale_info: Query Given Locale","stri_locale_list: List Available Locales","stri_locale_set: Set or Get Default Locale in stringi","stri_locate: Locate Occurrences of a Pattern","stri_locate_boundaries: Locate Text Boundaries","stri_match: Extract Regex Pattern Matches, Together with Capture Groups","stri_na2empty: Replace NAs with Empty Strings","stri_numbytes: Count the Number of Bytes","stri_opts_brkiter: Generate a List with BreakIterator Settings","stri_opts_collator: Generate a List with Collator Settings","stri_opts_fixed: Generate a List with Fixed Pattern Search Engine\u2019s Settings","stri_opts_regex: Generate a List with Regex Matcher Settings","stri_order: Ordering Permutation","stri_pad: Pad (Center/Left/Right Align) a String","stri_rand_lipsum: A Lorem Ipsum Generator","stri_rand_shuffle: Randomly Shuffle Code Points in Each String","stri_rand_strings: Generate Random Strings","stri_rank: Ranking","stri_read_lines: Read Text Lines from a Text File","stri_read_raw: Read Text File as Raw","stri_remove_empty: Remove All Empty Strings from a Character Vector","stri_replace: Replace Occurrences of a Pattern","stri_replace_na: Replace Missing Values in a Character Vector","stri_reverse: Reverse Each String","stri_sort: Sorting","stri_sort_key: Sort Keys","stri_split: Split a String By Pattern Matches","stri_split_boundaries: Split a String at Text Boundaries","stri_split_lines: Split a String Into Text 
Lines","stri_startsendswith: Determine if the Start or End of a String Matches a Pattern","stri_stats_general: General Statistics for a Character Vector","stri_stats_latex: Statistics for a Character Vector Containing LaTeX Commands","stri_sub: Extract a Substring From or Replace a Substring In a Character Vector","stri_sub_all: Extract or Replace Multiple Substrings","stri_subset: Select Elements that Match a Given Pattern","stri_timezone_info: Query a Given Time Zone","stri_timezone_list: List Available Time Zone Identifiers","stri_timezone_set: Set or Get Default Time Zone in stringi","stri_trans_casemap: Transform Strings with Case Mapping","stri_trans_char: Translate Characters","stri_trans_general: General Text Transforms, Including Transliteration","stri_trans_list: List Available Text Transforms and Transliterators","stri_trans_nf: Perform or Check For Unicode Normalization","stri_trim: Trim Characters from the Left and/or Right Side of a String","stri_unescape_unicode: Un-escape All Escape Sequences","stri_unique: Extract Unique Elements","stri_width: Determine the Width of Code Points","stri_wrap: Word Wrap Text to Format Paragraphs","stri_write_lines: Write Text Lines to a Text 
File"],titleterms:{"2013":2,"2014":2,"2015":2,"2016":2,"2017":2,"2018":2,"2019":2,"2020":2,"2021":2,"byte":[11,62],"case":93,"class":9,"default":[6,39,49,57,92],"function":[4,6,12],"new":2,For:97,Into:83,NAs:[4,61],THE:[0,13],about_argu:4,about_encod:5,about_local:6,about_search:7,about_search_boundari:8,about_search_charclass:9,about_search_col:10,about_search_fix:11,about_search_regex:12,about_stringi:13,align:68,all:[75,99],also:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],analysi:8,argument:[4,14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102,103],arithmet:20,ascii:[34,40],attribut:4,author:13,avail:[13,56,91,96],awar:10,between:[44,47],binari:[9,16],boundari:[8,19,47,59,82],breakiter:63,build:1,captur:60,categori:9,center:68,charact:[5,9,12,14,30,31,33,37,39,51,54,75,77,85,86,87,94,98],check:[34,35,36,97],code:[45,53,70,101],coercion:4,collat:[15,17,64],command:86,compar:[11,15,17],concaten:[14,51,52],conclus:1,contain:86,convers:5,convert:[24,32,40,41,42,43,44,54],count:[18,19,53,62],cran:2,creat:21,current:25,customis:1,data:[26,34,35,36,47],date:[20,21,22,23,25,26],declar:38,deprec:31,descript:[4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],detail:[5,6,7,8,9,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,4
8,50,51,52,53,54,55,56,57,58,59,60,62,63,64,65,66,67,68,69,70,71,72,73,74,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102,103],detect:[5,27,30,31],determin:[29,50,84,101],devel:2,duplic:[28,29],each:[38,70,78],element:[29,89,100],empti:[61,75],encod:[5,31,33,37,38,39,41,44],end:84,engin:[10,65],escap:[45,99],exampl:[14,15,16,17,18,19,20,21,22,23,24,26,27,28,29,30,34,36,45,46,47,48,50,51,52,53,54,55,57,58,59,60,61,62,64,65,66,67,68,69,70,71,72,75,76,77,78,79,80,81,82,84,85,86,87,88,89,90,91,92,93,94,95,97,98,99,100,101,102],express:12,extract:[46,47,60,87,88,100],facil:13,field:22,file:[73,74,103],fix:[11,65],flatten:48,format:[16,23,24,26,102],from:[32,73,75,87,98],gener:[9,63,64,65,66,69,71,85,95],get:[22,25,38,39,57,92],given:[44,55,89,90],glanc:12,group:60,handl:4,icu4c:1,icu:12,identifi:[6,91],includ:95,input:4,insensit:11,instal:1,introduct:1,ipsum:69,kei:80,known:37,languag:30,latex:86,left:[68,98],length:50,line:[73,83,103],list:[26,37,52,54,56,63,64,65,66,91,96],local:[6,10,11,31,55,56,57],localiz:26,locat:[58,59],lorem:69,map:93,match:[11,18,27,60,81,84,89],matcher:66,matrix:54,meta:12,miss:[4,77],multipl:88,nativ:41,normal:97,note:6,number:[18,19,53,62],object:[4,21],occurr:[46,58,76],oper:[12,16],operator_add:14,operator_compar:15,operator_dollar:16,order:67,packag:[0,3,13],pad:68,paragraph:102,pars:23,pass:4,pattern:[9,11,18,27,46,58,60,65,76,81,84,89],perform:97,permut:67,point:[45,53,70,101],posix:9,possibl:[34,35,36],preserv:4,process:[0,1,13],properti:9,queri:[33,49,55,90],random:71,randomli:70,rank:72,raw:74,read:[73,74],refer:[3,5,6,8,9,10,12,13,17,20,23,26,29,30,44,63,64,65,66,67,72,79,80,83,91,92,93,95,96,97,100,101,102],regex:[12,60,66],regular:12,remov:75,replac:[61,76,77,87,88],revers:78,right:[68,98],search:[7,10,65],see:[4,5,6,7,8,9,10,11,12,13,14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,69,70,71,72
,73,74,75,76,77,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],select:89,sensit:[6,10,31],sequenc:99,set:[30,39,49,57,63,64,65,66,92],shuffl:70,side:98,sort:[79,80],split:[81,82,83],sprintf:16,start:84,statist:[85,86],stream:[34,35,36],stri_compar:17,stri_count:18,stri_count_boundari:19,stri_datetime_add:20,stri_datetime_cr:21,stri_datetime_field:22,stri_datetime_format:23,stri_datetime_fstr:24,stri_datetime_now:25,stri_datetime_symbol:26,stri_detect:27,stri_dup:28,stri_dupl:29,stri_enc_detect2:31,stri_enc_detect:30,stri_enc_fromutf32:32,stri_enc_info:33,stri_enc_isascii:34,stri_enc_isutf16:35,stri_enc_isutf8:36,stri_enc_list:37,stri_enc_mark:38,stri_enc_set:39,stri_enc_toascii:40,stri_enc_ton:41,stri_enc_toutf32:42,stri_enc_toutf8:43,stri_encod:44,stri_escape_unicod:45,stri_extract:46,stri_extract_boundari:47,stri_flatten:48,stri_info:49,stri_isempti:50,stri_join:51,stri_join_list:52,stri_length:53,stri_list2matrix:54,stri_loc:58,stri_locale_info:55,stri_locale_list:56,stri_locale_set:57,stri_locate_boundari:59,stri_match:60,stri_na2empti:61,stri_numbyt:62,stri_opts_brkit:63,stri_opts_col:64,stri_opts_fix:65,stri_opts_regex:66,stri_ord:67,stri_pad:68,stri_rand_lipsum:69,stri_rand_shuffl:70,stri_rand_str:71,stri_rank:72,stri_read_lin:73,stri_read_raw:74,stri_remove_empti:75,stri_replac:76,stri_replace_na:77,stri_revers:78,stri_sort:79,stri_sort_kei:80,stri_split:81,stri_split_boundari:82,stri_split_lin:83,stri_startsendswith:84,stri_stats_gener:85,stri_stats_latex:86,stri_sub:87,stri_sub_al:88,stri_subset:89,stri_timezone_info:90,stri_timezone_list:91,stri_timezone_set:92,stri_trans_casemap:93,stri_trans_char:94,stri_trans_gener:95,stri_trans_list:96,stri_trans_nf:97,stri_trim:98,stri_unescape_unicod:99,stri_uniqu:100,stri_width:101,stri_wrap:102,stri_write_lin:103,string:[0,7,10,13,15,17,24,28,38,41,42,43,44,48,50,52,61,68,70,71,75,78,81,82,83,84,93,98],stringi:[0,1,2,3,4,5,6,8,9,10,11,12,39,49,57,92],strptime:24,style:[16,24],subst
r:[87,88],support:1,text:[8,10,19,47,59,73,74,82,83,95,96,102,103],time:[20,21,22,23,25,26,90,91,92],togeth:60,transform:[93,95,96],translat:94,transliter:[95,96],trim:98,two:14,unicod:[9,45,97],unicodeset:9,uniqu:100,usag:[14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],utf:[5,32,35,36,42,43],valu:[4,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103],vector:[4,14,51,75,77,85,86,87],what:2,width:101,without:[15,17],word:102,wrap:102,write:103,zero:50,zone:[90,91,92]}}) \ No newline at end of file diff --git a/man/about_encoding.Rd b/man/about_encoding.Rd index 75d9e130d..4287cf4fc 100644 --- a/man/about_encoding.Rd +++ b/man/about_encoding.Rd @@ -106,7 +106,7 @@ the same value denotes the ``plus-minus'' sign. Thus, a character encoding is a translation scheme: we need to communicate with \R somehow, relying on how it represents strings. -Basically, \R has a very simple encoding marking mechanism, +Overall, \R has a very simple encoding marking mechanism, see \code{\link{stri_enc_mark}}. 
There is an implicit assumption that your platform's default (native) encoding always extends ASCII -- \pkg{stringi} checks that whenever your native encoding diff --git a/man/about_locale.Rd b/man/about_locale.Rd index aa7cf3651..ffee44e50 100644 --- a/man/about_locale.Rd +++ b/man/about_locale.Rd @@ -119,6 +119,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/about_search_boundaries.Rd b/man/about_search_boundaries.Rd index 1506b0662..752424c16 100644 --- a/man/about_search_boundaries.Rd +++ b/man/about_search_boundaries.Rd @@ -68,6 +68,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/about_search_coll.Rd b/man/about_search_coll.Rd index b969728e5..d7c9f780c 100644 --- a/man/about_search_coll.Rd +++ b/man/about_search_coll.Rd @@ -57,6 +57,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/about_stringi.Rd b/man/about_stringi.Rd index f43cb3f47..da7e3023a 100644 --- a/man/about_stringi.Rd +++ b/man/about_stringi.Rd @@ -10,7 +10,7 @@ \pkg{stringi} is THE R package for fast, correct, consistent, and convenient string/text manipulation. It gives predictable results on every platform, in each locale, -and under any ``native'' character encoding. +and under any native character encoding. 
\bold{Keywords}: R, text processing, character strings, internationalization, localization, ICU, ICU4C, i18n, l10n, Unicode. @@ -34,7 +34,7 @@ Manual pages on general topics: locale-sensitive operations. In particular, see \code{\link{stri_opts_collator}} for a description of the string collation algorithm, which is used for string comparing, ordering, - sorting, case-folding, and searching. + ranking, sorting, case-folding, and searching. \item \link{about_arguments} -- information on how \pkg{stringi} treats its functions' arguments. @@ -92,8 +92,8 @@ and \code{\link{stri_trans_general}} for other universal yet powerful text transforms, including transliteration. \item \code{\link{stri_cmp}}, \code{\link{\%s<\%}}, \code{\link{stri_order}}, -\code{\link{stri_sort}}, \code{\link{stri_unique}}, and -\code{\link{stri_duplicated}} for collation-based, +\code{\link{stri_sort}}, \code{\link{stri_rank}}, \code{\link{stri_unique}}, +and \code{\link{stri_duplicated}} for collation-based, locale-aware operations, see also \link{about_locale}. \item \code{\link{stri_split_lines}} (among others) @@ -141,8 +141,6 @@ Other stringi_general_topics: \author{ Marek Gagolewski, with contributions from Bartek Tartanus and many others. -ICU4C was developed by IBM and others. -The Unicode Character Database is due to Unicode, Inc.; -see the COPYRIGHTS file for more details. +ICU4C was developed by IBM, Unicode, Inc., and others. 
} \concept{stringi_general_topics} diff --git a/man/operator_compare.Rd b/man/operator_compare.Rd index 14498112d..b08b1bb2c 100644 --- a/man/operator_compare.Rd +++ b/man/operator_compare.Rd @@ -95,6 +95,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_compare.Rd b/man/stri_compare.Rd index 462019fa4..b3e617997 100644 --- a/man/stri_compare.Rd +++ b/man/stri_compare.Rd @@ -148,6 +148,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_count_boundaries.Rd b/man/stri_count_boundaries.Rd index 33254c0ff..0b50dcaf4 100644 --- a/man/stri_count_boundaries.Rd +++ b/man/stri_count_boundaries.Rd @@ -84,6 +84,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_duplicated.Rd b/man/stri_duplicated.Rd index df6e07cae..61eac96da 100644 --- a/man/stri_duplicated.Rd +++ b/man/stri_duplicated.Rd @@ -97,6 +97,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_enc_detect2.Rd b/man/stri_enc_detect2.Rd index 8497d6cf9..c6c08cab5 100644 --- a/man/stri_enc_detect2.Rd +++ b/man/stri_enc_detect2.Rd @@ -71,6 +71,7 @@ Other locale_sensitive: 
\code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_extract_boundaries.Rd b/man/stri_extract_boundaries.Rd index f80650d2b..760893e17 100644 --- a/man/stri_extract_boundaries.Rd +++ b/man/stri_extract_boundaries.Rd @@ -109,6 +109,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_locate_boundaries.Rd b/man/stri_locate_boundaries.Rd index b16c7c41a..9b91ac422 100644 --- a/man/stri_locate_boundaries.Rd +++ b/man/stri_locate_boundaries.Rd @@ -113,6 +113,7 @@ Other locale_sensitive: \code{\link{stri_extract_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_opts_collator.Rd b/man/stri_opts_collator.Rd index 159d05eb6..b77602004 100644 --- a/man/stri_opts_collator.Rd +++ b/man/stri_opts_collator.Rd @@ -118,6 +118,7 @@ Other locale_sensitive: \code{\link{stri_extract_all_boundaries}()}, \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_order.Rd b/man/stri_order.Rd index 64b6838b1..d6cbe9093 100644 --- a/man/stri_order.Rd +++ b/man/stri_order.Rd @@ -37,15 +37,15 @@ For more information on \pkg{ICU}'s Collator and how to tune it up in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. 
As usual in \pkg{stringi}, non-character inputs are coerced to strings, -see an example below for a perhaps non-intuitive behavior of lexicographic +see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. - - - This function uses a stable sort algorithm (\pkg{STL}'s \code{stable_sort}), which performs up to \eqn{N*log^2(N)} element comparisons, where \eqn{N} is the length of \code{str}. + +For ordering with regards to multiple criteria (such as sorting +data frames by more than 1 column), see \code{\link{stri_rank}}. } \examples{ stri_order(c('hladny', 'chladny'), locale='pl_PL') @@ -71,6 +71,7 @@ Other locale_sensitive: \code{\link{stri_extract_all_boundaries}()}, \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_rank.Rd b/man/stri_rank.Rd new file mode 100644 index 000000000..8bead007b --- /dev/null +++ b/man/stri_rank.Rd @@ -0,0 +1,70 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/sort.R +\name{stri_rank} +\alias{stri_rank} +\title{Ranking} +\usage{ +stri_rank(str, ..., opts_collator = NULL) +} +\arguments{ +\item{str}{a character vector} + +\item{...}{additional settings for \code{opts_collator}} + +\item{opts_collator}{a named list with \pkg{ICU} Collator's options, +see \code{\link{stri_opts_collator}}, \code{NULL} +for default collation options} +} +\value{ +The result is a vector of ranks corresponding to each +string in \code{str}. +} +\description{ +This function ranks each string in a character vector according to a +locale-dependent lexicographic order. +It is a portable replacement for the base \code{xtfrm} function. +} +\details{ +Missing values result in missing ranks and tied observations receive +the same ranks (based on min). 
+ +For more information on \pkg{ICU}'s Collator and how to tune it up +in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. +} +\examples{ +stri_rank(c('hladny', 'chladny'), locale='pl_PL') +stri_rank(c('hladny', 'chladny'), locale='sk_SK') + +stri_rank("a" \%s+\% c(1, 100, 2, 101, 11, 10)) # lexicographic order +stri_rank("a" \%s+\% c(1, 100, 2, 101, 11, 10), numeric=TRUE) + +# Ordering a data frame with respect to two criteria: +X <- data.frame(a=c("b", NA, "b", "b", NA, "a", "a", "c"), b=runif(8)) +X[order(stri_rank(X$a), X$b), ] +} +\references{ +\emph{Collation} - ICU User Guide, +\url{http://userguide.icu-project.org/collation} +} +\seealso{ +Other locale_sensitive: +\code{\link{\%s<\%}()}, +\code{\link{about_locale}}, +\code{\link{about_search_boundaries}}, +\code{\link{about_search_coll}}, +\code{\link{stri_compare}()}, +\code{\link{stri_count_boundaries}()}, +\code{\link{stri_duplicated}()}, +\code{\link{stri_enc_detect2}()}, +\code{\link{stri_extract_all_boundaries}()}, +\code{\link{stri_locate_all_boundaries}()}, +\code{\link{stri_opts_collator}()}, +\code{\link{stri_order}()}, +\code{\link{stri_sort_key}()}, +\code{\link{stri_sort}()}, +\code{\link{stri_split_boundaries}()}, +\code{\link{stri_trans_tolower}()}, +\code{\link{stri_unique}()}, +\code{\link{stri_wrap}()} +} +\concept{locale_sensitive} diff --git a/man/stri_sort.Rd b/man/stri_sort.Rd index 7110726b9..79b8b4b09 100644 --- a/man/stri_sort.Rd +++ b/man/stri_sort.Rd @@ -29,7 +29,7 @@ The result is a sorted version of \code{str}, i.e., a character vector. } \description{ -This function sorts a character vector according to the locale-dependent +This function sorts a character vector according to a locale-dependent lexicographic order. } \details{ @@ -37,7 +37,7 @@ For more information on \pkg{ICU}'s Collator and how to tune it up in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. 
As usual in \pkg{stringi}, non-character inputs are coerced to strings, -see an example below for a perhaps non-intitive behavior of lexicographic +see an example below for a somewhat non-intuitive behavior of lexicographic sorting on numeric inputs. This function uses a stable sort algorithm (\pkg{STL}'s \code{stable_sort}), @@ -69,6 +69,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_split_boundaries}()}, \code{\link{stri_trans_tolower}()}, diff --git a/man/stri_sort_key.Rd b/man/stri_sort_key.Rd index 36352f13b..222ed97f2 100644 --- a/man/stri_sort_key.Rd +++ b/man/stri_sort_key.Rd @@ -17,18 +17,22 @@ for default collation options} } \value{ The result is a character vector with the same length as \code{str} that -contains the sort keys. +contains the sort keys. The output is marked as \code{bytes}-encoded. } \description{ -This function computes a locale-dependent 'sort key', which is an alternative +This function computes a locale-dependent sort key, which is an alternative character representation of the string that, when ordered in the C locale -(which orders using bytes directly), will give an equivalent ordering to the -original string. It is useful for enhancing algorithms that sort only in the -C locale with the ability to be locale-aware. +(which orders using the underlying bytes directly), will give an equivalent +ordering to the original string. It is useful for enhancing algorithms +that sort only in the C locale (e.g., the \code{strcmp} function in libc) +with the ability to be locale-aware. } \details{ For more information on \pkg{ICU}'s Collator and how to tune it up in \pkg{stringi}, refer to \code{\link{stri_opts_collator}}. + +See also \code{\link{stri_rank}} for ranking strings with a single character +vector, i.e., generating relative sort keys. 
} \examples{ stri_sort_key(c('hladny', 'chladny'), locale='pl_PL') @@ -52,6 +56,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, \code{\link{stri_trans_tolower}()}, diff --git a/man/stri_split_boundaries.Rd b/man/stri_split_boundaries.Rd index af3cf122a..0fa9eabc7 100644 --- a/man/stri_split_boundaries.Rd +++ b/man/stri_split_boundaries.Rd @@ -98,6 +98,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_trans_tolower}()}, diff --git a/man/stri_trans_casemap.Rd b/man/stri_trans_casemap.Rd index 57e0fa679..805ca3c06 100644 --- a/man/stri_trans_casemap.Rd +++ b/man/stri_trans_casemap.Rd @@ -84,6 +84,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_unique.Rd b/man/stri_unique.Rd index 632206f47..100e8a200 100644 --- a/man/stri_unique.Rd +++ b/man/stri_unique.Rd @@ -59,6 +59,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, \code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/man/stri_wrap.Rd b/man/stri_wrap.Rd index 3babb38e0..be613f911 100644 --- a/man/stri_wrap.Rd +++ b/man/stri_wrap.Rd @@ -139,6 +139,7 @@ Other locale_sensitive: \code{\link{stri_locate_all_boundaries}()}, \code{\link{stri_opts_collator}()}, \code{\link{stri_order}()}, +\code{\link{stri_rank}()}, \code{\link{stri_sort_key}()}, 
\code{\link{stri_sort}()}, \code{\link{stri_split_boundaries}()}, diff --git a/src/stri_exports.h b/src/stri_exports.h index 6a363a7c0..0f916e5ca 100644 --- a/src/stri_exports.h +++ b/src/stri_exports.h @@ -51,6 +51,7 @@ SEXP stri_cmp_neq(SEXP e1, SEXP e2); // sort.cpp SEXP stri_sort(SEXP str, SEXP decreasing=Rf_ScalarLogical(FALSE), SEXP na_last=Rf_ScalarLogical(NA_LOGICAL), SEXP opts_collator=R_NilValue); +SEXP stri_rank(SEXP str, SEXP opts_collator=R_NilValue); SEXP stri_order(SEXP str, SEXP decreasing=Rf_ScalarLogical(FALSE), SEXP na_last=Rf_ScalarLogical(TRUE), SEXP opts_collator=R_NilValue); SEXP stri_sort_key(SEXP str, SEXP opts_collator=R_NilValue); diff --git a/src/stri_sort.cpp b/src/stri_sort.cpp index c4b41819a..7b63a28a6 100644 --- a/src/stri_sort.cpp +++ b/src/stri_sort.cpp @@ -42,6 +42,10 @@ #include +# define STRI_SORTRANKORDER_SORT 1 +# define STRI_SORTRANKORDER_RANK 2 +# define STRI_SORTRANKORDER_ORDER 3 + /** help struct for stri_order **/ struct StriSortComparer { StriContainerUTF8* cont; @@ -60,8 +64,8 @@ struct StriSortComparer { // if (col) { UErrorCode status = U_ZERO_ERROR; int ret = (int)ucol_strcollUTF8(col, - cont->get(a).c_str(), cont->get(a).length(), - cont->get(b).c_str(), cont->get(b).length(), &status); + cont->get(a).c_str(), cont->get(a).length(), + cont->get(b).c_str(), cont->get(b).length(), &status); STRI__CHECKICUSTATUS_THROW(status, {/* do nothing special on err */}) return (decreasing)?(ret > 0):(ret < 0); // } @@ -76,14 +80,14 @@ struct StriSortComparer { }; -/** Generate the ordering permutation, possibly with collation [internal] +/** Sort, rank, or generate an ordering permutation * * @param str character vector * @param decreasing single logical value * @param na_last single logical value * @param opts_collator passed to stri__ucol_open() - * @param _type internal, 1 for order, 2 for sort - * @return integer vector (permutation) or character vector + * @param _type internal, 1 for sort, 2 for rank, 3 for order + *
@return integer vector (permutation/ranks) or character vector * * @version 0.1-?? (Marek Gagolewski) * @@ -108,17 +112,29 @@ struct StriSortComparer { * * @version 0.6-1 (Marek Gagolewski, 2015-07-05) * use stri_order, stri_sort + * + * @version 1.6.1 (Marek Gagolewski, 2021-04-30) + * rank */ -SEXP stri_order_or_sort(SEXP str, SEXP decreasing, SEXP na_last, +SEXP stri_order_rank_or_sort(SEXP str, SEXP decreasing, SEXP na_last, SEXP opts_collator, int _type) { bool decr = stri__prepare_arg_logical_1_notNA(decreasing, "decreasing"); PROTECT(na_last = stri_prepare_arg_logical_1(na_last, "na_last")); PROTECT(str = stri_prepare_arg_string(str, "str")); // prepare string argument + int na_last_int = INTEGER(na_last)[0]; // type is an internal arg -- check manually - if (_type < 1 || _type > 2) + if (_type < 1 || _type > 3) + Rf_error(MSG__INCORRECT_INTERNAL_ARG); + + if ( + _type == STRI_SORTRANKORDER_RANK && + (decr || na_last_int == NA_LOGICAL || !na_last_int) + ) { + // rank supports only decreasing=FALSE and na_last=TRUE; reject anything else Rf_error(MSG__INCORRECT_INTERNAL_ARG); + } // call stri__ucol_open after prepare_arg: // if prepare_arg had failed, we would have a mem leak @@ -131,7 +147,7 @@ SEXP stri_order_or_sort(SEXP str, SEXP decreasing, SEXP na_last, R_len_t vectorize_length = LENGTH(str); StriContainerUTF8 str_cont(str, vectorize_length); - int na_last_int = INTEGER(na_last)[0]; + deque NA_pos; vector order(vectorize_length); @@ -154,45 +170,81 @@ SEXP stri_order_or_sort(SEXP str, SEXP decreasing, SEXP na_last, SEXP ret; - if (_type == 1) { - // order - STRI__PROTECT(ret = Rf_allocVector(INTSXP, k+NA_pos.size())); - int* ret_tab = INTEGER(ret); - + if (_type == STRI_SORTRANKORDER_SORT) { + // sort + STRI__PROTECT(ret = Rf_allocVector(STRSXP, k+NA_pos.size())); R_len_t j = 0; if (na_last_int != NA_LOGICAL && !na_last_int) { // put NAs first for (std::deque::iterator it=NA_pos.begin(); it!=NA_pos.end(); ++it, ++j) - ret_tab[j] = (*it)+1; // 1-based indices + SET_STRING_ELT(ret, j,
NA_STRING); } for (std::vector::iterator it=order.begin(); it!=order.end(); ++it, ++j) - ret_tab[j] = (*it)+1; // 1-based indices + SET_STRING_ELT(ret, j, str_cont.toR(*it)); if (na_last_int != NA_LOGICAL && na_last_int) { // put NAs last for (std::deque::iterator it=NA_pos.begin(); it!=NA_pos.end(); ++it, ++j) - ret_tab[j] = (*it)+1; // 1-based indices + SET_STRING_ELT(ret, j, NA_STRING); } } - else { - // sort - STRI__PROTECT(ret = Rf_allocVector(STRSXP, k+NA_pos.size())); + else if (_type == STRI_SORTRANKORDER_ORDER) { + STRI__PROTECT(ret = Rf_allocVector(INTSXP, k+NA_pos.size())); + int* ret_tab = INTEGER(ret); + R_len_t j = 0; if (na_last_int != NA_LOGICAL && !na_last_int) { // put NAs first for (std::deque::iterator it=NA_pos.begin(); it!=NA_pos.end(); ++it, ++j) - SET_STRING_ELT(ret, j, NA_STRING); + ret_tab[j] = (*it)+1; // 1-based indices } for (std::vector::iterator it=order.begin(); it!=order.end(); ++it, ++j) - SET_STRING_ELT(ret, j, str_cont.toR(*it)); + ret_tab[j] = (*it)+1; // 1-based indices if (na_last_int != NA_LOGICAL && na_last_int) { // put NAs last for (std::deque::iterator it=NA_pos.begin(); it!=NA_pos.end(); ++it, ++j) - SET_STRING_ELT(ret, j, NA_STRING); + ret_tab[j] = (*it)+1; // 1-based indices + } + } + else if (_type == STRI_SORTRANKORDER_RANK) { + // NAs are always preserved, order is increasing + STRI__PROTECT(ret = Rf_allocVector(INTSXP, vectorize_length)); + int* ret_tab = INTEGER(ret); + for (R_len_t i=0; i::iterator it=order.begin(); it!=order.end(); ++it) { + cur_idx = *it; + + if (j_first > 1) { + UErrorCode status = U_ZERO_ERROR; + if ( + 0 != (int)ucol_strcollUTF8( + col, + str_cont.get(last_idx).c_str(), + str_cont.get(last_idx).length(), + str_cont.get(cur_idx).c_str(), + str_cont.get(cur_idx).length(), &status + ) + ) { + j_min = j_first; + } + // else reuse j_min == a tie. 
+ STRI__CHECKICUSTATUS_THROW(status, {/* do nothing special on err */}) + } + + + ret_tab[cur_idx] = j_min; + last_idx = cur_idx; + j_first++; } + } if (col) { @@ -212,37 +264,57 @@ SEXP stri_order_or_sort(SEXP str, SEXP decreasing, SEXP na_last, } -/** Return an ordering permutation + + +/** Sort a character vector * * @param str character vector * @param decreasing single logical value * @param na_last single logical value * @param opts_collator passed to stri__ucol_open() - * @return integer vector (permutation) + * @return character vector * * @version 0.6-1 (Marek Gagolewski, 2015-07-05) - * Call stri_order_or_sort + * Call stri_order_rank_or_sort */ -SEXP stri_order(SEXP str, SEXP decreasing, SEXP na_last, SEXP opts_collator) +SEXP stri_sort(SEXP str, SEXP decreasing, SEXP na_last, SEXP opts_collator) { - return stri_order_or_sort(str, decreasing, na_last, opts_collator, 1); + return stri_order_rank_or_sort(str, decreasing, na_last, opts_collator, STRI_SORTRANKORDER_SORT); } -/** Sort a character vector + +/** Return an ordering permutation * * @param str character vector * @param decreasing single logical value * @param na_last single logical value * @param opts_collator passed to stri__ucol_open() - * @return charcter vector + * @return integer vector (permutation) * * @version 0.6-1 (Marek Gagolewski, 2015-07-05) - * Call stri_order_or_sort + * Call stri_order_rank_or_sort */ -SEXP stri_sort(SEXP str, SEXP decreasing, SEXP na_last, SEXP opts_collator) +SEXP stri_order(SEXP str, SEXP decreasing, SEXP na_last, SEXP opts_collator) { - return stri_order_or_sort(str, decreasing, na_last, opts_collator, 2); + return stri_order_rank_or_sort(str, decreasing, na_last, opts_collator, STRI_SORTRANKORDER_ORDER); +} + + +/** Rank strings + * + * @param str character vector + * @param opts_collator passed to stri__ucol_open() + * @return integer vector (ranks) + * + * @version 1.6.1 (Marek Gagolewski, 2021-04-29) + */ +SEXP stri_rank(SEXP str, SEXP opts_collator) +{ +
return stri_order_rank_or_sort(str, + Rf_ScalarLogical(FALSE)/*decreasing*/, + Rf_ScalarLogical(TRUE)/*na_last*/, + opts_collator, STRI_SORTRANKORDER_RANK); } @@ -499,6 +571,7 @@ SEXP stri_duplicated_any(SEXP str, SEXP fromLast, SEXP opts_collator) }) } + /** Compute a character sort key * * @param str character vector @@ -506,6 +579,8 @@ SEXP stri_duplicated_any(SEXP str, SEXP fromLast, SEXP opts_collator) * @return character vector * * @version 1.4.7 (Davis Vaughan, 2020-07-15) + * @version 1.6.1 (Marek Gagolewski, 2021-04-29) + * output `bytes`-encoded strings */ SEXP stri_sort_key(SEXP str, SEXP opts_collator) { PROTECT(str = stri_prepare_arg_string(str, "str")); @@ -557,7 +632,7 @@ SEXP stri_sort_key(SEXP str, SEXP opts_collator) { // which we don't want to copy into the R CHARSXP R_len_t key_char_size = key_size - 1; - SET_STRING_ELT(ret, i, Rf_mkCharLenCE(key_buffer.data(), key_char_size, CE_UTF8)); + SET_STRING_ELT(ret, i, Rf_mkCharLenCE(key_buffer.data(), key_char_size, CE_BYTES)); } if (col) { diff --git a/src/stri_stringi.cpp b/src/stri_stringi.cpp index e1162fe81..cc1d2d82b 100644 --- a/src/stri_stringi.cpp +++ b/src/stri_stringi.cpp @@ -154,6 +154,7 @@ const R_CallMethodDef cCallMethods[] = { STRI__MK_CALL("C_stri_match_all_regex", stri_match_all_regex, 5), STRI__MK_CALL("C_stri_numbytes", stri_numbytes, 1), STRI__MK_CALL("C_stri_order", stri_order, 4), + STRI__MK_CALL("C_stri_rank", stri_rank, 2), STRI__MK_CALL("C_stri_sort", stri_sort, 4), STRI__MK_CALL("C_stri_sort_key", stri_sort_key, 2), STRI__MK_CALL("C_stri_pad", stri_pad, 5),