Usage
rm_bracket(text.var, pattern = "all", trim = TRUE, clean = TRUE,
replacement = "", extract = FALSE, include.markers = ifelse(extract,
FALSE, TRUE), dictionary = getOption("regex.library"), ...)
rm_round(text.var, pattern = "(", trim = TRUE, clean = TRUE,
replacement = "", extract = FALSE, include.markers = ifelse(extract,
FALSE, TRUE), dictionary = getOption("regex.library"), ...)
rm_square(text.var, pattern = "[", trim = TRUE, clean = TRUE,
replacement = "", extract = FALSE, include.markers = ifelse(extract,
FALSE, TRUE), dictionary = getOption("regex.library"), ...)
rm_curly(text.var, pattern = "{", trim = TRUE, clean = TRUE,
replacement = "", extract = FALSE, include.markers = ifelse(extract,
FALSE, TRUE), dictionary = getOption("regex.library"), ...)
rm_angle(text.var, pattern = "<", trim="TRUE," clean="TRUE," replacement="" ,="" extract="FALSE," include.markers="ifelse(extract," false,="" true),="" dictionary="getOption("regex.library")," ...)="" rm_bracket_multiple(text.var,="" pattern="all" merge="TRUE)" }="" - text.var
{The text variable.}
- pattern
{The type of bracket (and encased text) to remove. This is one
or more of the strings "curly"/"{", "square"/"[",
"round"/"(", "angle"/"<"< code=""> and "all". These
strings correspond to: {, [, (, < or all four types.}
- trim
{logical. If TRUE removes leading and trailing white
spaces.}
- clean
{trim logical. If TRUE extra white spaces and escaped
character will be removed.}
- replacement
{Replacement for matched pattern.}
- extract
{logical. If TRUE the bracketed text is extracted into
a list of vectors.}
- include.markers
{logical. If TRUE and extract = TRUE returns
the markers (left/right) and the text between.}
- dictionary
{A dictionary of canned regular expressions to search within
if pattern begins with "@rm_".}
- merge
{logical. If TRUE the results of each bracket type will
be merged by string. FALSE returns a named list of lists of vectors
of bracketed text per bracket type.}
- ...
{Other arguments passed to gsub.}
rm_bracket - returns a character string with
multiple brackets removed. If extract = TRUE the results are
optionally merged and named by bracket type. This is more flexible than
rm_bracket but slower.
rm_round - returns a character string with round brackets removed.
rm_square - returns a character string with square brackets
removed.
rm_curly - returns a character string with curly brackets
removed.
rm_angle - returns a character string with angle brackets
removed.
rm_bracket_multiple - returns a character string with
multiple brackets removed. If extract = TRUE the results are
optionally merged and named by bracket type. This is more flexible than
rm_bracket but slower.
Remove/replace/extract bracketed strings.
examp <- structure(list(person = structure(c(1L, 2L, 1L, 3L),
.Label = c("bob", "greg", "sue"), class = "factor"), text =
c("I love chicken [unintelligible]!",
"Me too! (laughter) It's so good.[interrupting]",
"Yep it's awesome {reading}.", "Agreed. {is so much fun}")), .Names =
c("person", "text"), row.names = c(NA, -4L), class = "data.frame")
examp
rm_bracket(examp$text, pattern = "square")
rm_bracket(examp$text, pattern = "curly")
rm_bracket(examp$text, pattern = c("square", "round"))
rm_bracket(examp$text)
rm_bracket(examp$text, pattern = "square", extract=TRUE)
rm_bracket(examp$text, pattern = "curly", extract=TRUE)
rm_bracket(examp$text, pattern = c("square", "round"), extract=TRUE)
rm_bracket(examp$text, pattern = c("square", "round"), merge = FALSE, extract=TRUE)
rm_bracket(examp$text, extract=TRUE)
rm_bracket(examp$tex, include.markers=TRUE, extract=TRUE)
library(qdap)
rm_bracket(examp$tex, pattern="curly", extract=TRUE) %>%
unlist() %>%
na.omit() %>%
paste2()
x <- "I like [bots] (not). And many do not {he he}"
rm_round(x)
rm_round(x, extract = TRUE)
rm_round(x, include.marker = FALSE)
rm_round(x, extract = TRUE, include.marker = TRUE)
rm_square(x)
rm_square(x, extract = TRUE)
rm_curly(x)
rm_curly(x, extract = TRUE)
rm_angle(x)
rm_angle(x, extract = TRUE)
lapply(rm_between('She said, "I am!" and he responded..."Am what?".',
left='"', right='"', extract = TRUE), "[", c(TRUE, FALSE))
[object Object],[object Object]
http://stackoverflow.com/q/8621066/1000343
gsub,
rm_between,
stri_extract_all_regex
Other rm_.functions: rm_abbreviation;
rm_between,
rm_between_multiple;
rm_caps_phrase; rm_caps;
rm_citation_tex; rm_citation;
rm_city_state_zip;
rm_city_state; rm_date;
rm_default; rm_dollar;
rm_email; rm_emoticon;
rm_endmark; rm_hash;
rm_nchar_words; rm_non_ascii;
rm_number; rm_percent;
rm_phone; rm_postal_code;
rm_repeated_characters;
rm_repeated_phrases;
rm_repeated_words; rm_tag;
rm_time; rm_title_name;
rm_twitter_url, rm_url;
rm_white, rm_white_bracket,
rm_white_colon,
rm_white_comma,
rm_white_endmark,
rm_white_lead,
rm_white_lead_trail,
rm_white_multiple,
rm_white_punctuation,
rm_white_trail; rm_zip
bracket"<>",>