rm_bracket {qdapRegex} | R Documentation |
Remove/Replace/Extract Brackets
Description
Remove/replace/extract bracketed strings.
Usage
rm_bracket(
text.var,
pattern = "all",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = FALSE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
rm_round(
text.var,
pattern = "(",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = FALSE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
rm_square(
text.var,
pattern = "[",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = FALSE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
rm_curly(
text.var,
pattern = "{",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = FALSE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
rm_angle(
text.var,
pattern = "<",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = FALSE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
rm_bracket_multiple(
text.var,
trim = TRUE,
clean = TRUE,
pattern = "all",
replacement = "",
extract = FALSE,
include.markers = FALSE,
merge = TRUE
)
ex_bracket(
text.var,
pattern = "all",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = TRUE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
ex_bracket_multiple(
text.var,
trim = TRUE,
clean = TRUE,
pattern = "all",
replacement = "",
extract = TRUE,
include.markers = FALSE,
merge = TRUE
)
ex_angle(
text.var,
pattern = "<",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = TRUE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
ex_round(
text.var,
pattern = "(",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = TRUE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
ex_square(
text.var,
pattern = "[",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = TRUE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
ex_curly(
text.var,
pattern = "{",
trim = TRUE,
clean = TRUE,
replacement = "",
extract = TRUE,
include.markers = ifelse(extract, FALSE, TRUE),
dictionary = getOption("regex.library"),
...
)
Arguments
text.var |
The text variable. |
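pattern |
The type of bracket (and encased text) to remove. This is one
or more of the strings "curly"/"{", "square"/"[", "round"/"(",
"angle"/"<" and "all". These strings correspond to: {, [, (, <
or all four types. |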
trim |
logical. If TRUE removes leading and trailing white spaces. |
clean |
logical. If TRUE extra white spaces and escaped characters will be
removed. |
replacement |
Replacement for matched pattern. |
extract |
logical. If TRUE the bracketed text is extracted into a list of
vectors. |
include.markers |
logical. If TRUE and extract = TRUE returns the markers (left/right)
and the text between. |
dictionary |
A dictionary of canned regular expressions to search within
if pattern begins with "@rm_". |
... |
Other arguments passed to gsub. |
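merge |
logical. If TRUE the results of each bracket type will be merged by
string. FALSE returns a named list of lists of vectors of bracketed text
per bracket type. |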
Value
rm_bracket
- returns a character string with the bracket types selected by
pattern (and the text they encase) removed. If extract = TRUE
the bracketed strings are extracted instead.
rm_round
- returns a character string with round brackets removed.
rm_square
- returns a character string with square brackets
removed.
rm_curly
- returns a character string with curly brackets
removed.
rm_angle
- returns a character string with angle brackets
removed.
rm_bracket_multiple
- returns a character string with
multiple brackets removed. If extract = TRUE
the results are
optionally merged and named by bracket type. This is more flexible than
rm_bracket
but slower.
Author(s)
Martin Morgan and Tyler Rinker <tyler.rinker@gmail.com>.
References
https://stackoverflow.com/q/8621066/1000343
See Also
gsub
,
rm_between
,
stri_extract_all_regex
Other rm_ functions:
rm_abbreviation()
,
rm_between()
,
rm_caps_phrase()
,
rm_caps()
,
rm_citation_tex()
,
rm_citation()
,
rm_city_state_zip()
,
rm_city_state()
,
rm_date()
,
rm_default()
,
rm_dollar()
,
rm_email()
,
rm_emoticon()
,
rm_endmark()
,
rm_hash()
,
rm_nchar_words()
,
rm_non_ascii()
,
rm_non_words()
,
rm_number()
,
rm_percent()
,
rm_phone()
,
rm_postal_code()
,
rm_repeated_characters()
,
rm_repeated_phrases()
,
rm_repeated_words()
,
rm_tag()
,
rm_time()
,
rm_title_name()
,
rm_url()
,
rm_white()
,
rm_zip()
Examples
# Example transcript: one speaker and one utterance per row. The utterances
# mix square, round and curly bracketed annotations.
examp <- data.frame(
  person = factor(
    c("bob", "greg", "bob", "sue"),
    levels = c("bob", "greg", "sue")
  ),
  text = c(
    "I love chicken [unintelligible]!",
    "Me too! (laughter) It's so good.[interrupting]",
    "Yep it's awesome {reading}.",
    "Agreed. {is so much fun}"
  ),
  stringsAsFactors = FALSE
)
examp

# Remove bracketed text, choosing the bracket type(s) by name; the last call
# uses the default pattern = "all".
rm_bracket(examp$text, pattern = "square")
rm_bracket(examp$text, pattern = "curly")
rm_bracket(examp$text, pattern = c("square", "round"))
rm_bracket(examp$text)

# The ex_ variants default to extract = TRUE.
ex_bracket(examp$text, pattern = "square")
ex_bracket(examp$text, pattern = "curly")
ex_bracket(examp$text, pattern = c("square", "round"))
# NOTE(review): `merge` is not a formal argument of ex_bracket() in the Usage
# section (only the *_multiple variants list it), so here it travels through
# `...` -- confirm it has an effect, or call ex_bracket_multiple() instead.
ex_bracket(examp$text, pattern = c("square", "round"), merge = FALSE)
ex_bracket(examp$text)
# Spell the column name out in full: `examp$tex` only works through `$`
# partial matching.
ex_bracket(examp$text, include.markers = TRUE)

## Not run:
# presumably qdap supplies `%>%` and paste2() used below -- TODO confirm
library(qdap)
ex_bracket(examp$text, pattern = "curly") %>%
  unlist() %>%
  na.omit() %>%
  paste2()
## End(Not run)

# One string containing all four bracket types, run through each
# single-bracket remover/extractor pair.
x <- "I like [bots] (not). And <likely> many do not {he he}"

rm_round(x)
ex_round(x)
# Full argument name; `include.marker` relied on partial argument matching.
ex_round(x, include.markers = TRUE)
rm_square(x)
ex_square(x)
rm_curly(x)
ex_curly(x)
rm_angle(x)
ex_angle(x)

# The logical index c(TRUE, FALSE) is recycled, so this keeps the 1st, 3rd,
# ... element of each extraction result.
lapply(
  ex_between(
    'She said, "I am!" and he responded..."Am what?".',
    left = '"', right = '"'
  ),
  "[", c(TRUE, FALSE)
)