rm_time(text.var, trim = !extract, clean = TRUE, pattern = "@rm_time", replacement = "", extract = FALSE, dictionary = getOption("regex.library"), ...)
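Arguments:
text.var: The text variable.
trim: logical. If TRUE, removes leading and trailing white spaces.
clean: logical. If TRUE, extra white spaces and escaped characters will be
removed.
pattern: A character string containing a regular expression (or character
string for fixed = TRUE) to be matched in the given character vector (see
Details for additional information). By default, @rm_time uses the rm_time
regex from the regular expression dictionary supplied via the dictionary
argument.
replacement: Replacement for the matched pattern.
extract: logical. If TRUE, the times are extracted into a list of vectors.
dictionary: A dictionary of canned regular expressions to search within if
pattern begins with "@rm_".
...: Other arguments passed to gsub.

Remove/replace/extract time from a string.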
The default regular expression used by rm_time finds
times without an AM/PM suffix. This behavior can be altered by using a
secondary regular expression from the regex_usa
data (or other dictionary) via pattern = "@rm_time2". See
Examples for example usage.
The time regular expression was taken from: http://stackoverflow.com/a/25111133/1000343
x <- c("R uses 1:5 for 1, 2, 3, 4, 5.",
    "At 3:00 we'll meet up and leave by 4:30:20",
    "We'll meet at 6:33.",
    "He ran it in :22.34")

rm_time(x)
[1] "R uses 1:5 for 1, 2, 3, 4, 5." "At we'll meet up and leave by" "We'll meet at ." "He ran it in"

rm_time(x, extract=TRUE)
[[1]]
[1] NA

[[2]]
[1] "3:00" "4:30:20"

[[3]]
[1] "6:33"

[[4]]
[1] ":22.34"

## With AM/PM
x <- c(
    "I'm getting 3:04 AM just fine, but...",
    "for 10:47 AM I'm getting 0:47 AM instead.",
    "no time here",
    "Some time has 12:04 with no AM/PM after it",
    "Some time has 12:04 a.m. or the form 1:22 pm"
)

rm_time(x, extract=TRUE)
[[1]]
[1] "3:04"

[[2]]
[1] "10:47" "0:47"

[[3]]
[1] NA

[[4]]
[1] "12:04"

[[5]]
[1] "12:04" "1:22"

rm_time(x, pat="@rm_time2", extract=TRUE)
[[1]]
[1] "3:04 AM"

[[2]]
[1] "10:47 AM" "0:47 AM"

[[3]]
[1] NA

[[4]]
[1] NA

[[5]]
[1] "12:04 a.m." "1:22 pm"

rm_time(x, pat="@rm_time2")
[1] "I'm getting just fine, but..." "for I'm getting instead."
[3] "no time here" "Some time has 12:04 with no AM/PM after it"
[5] "Some time has or the form"

rm_time(x, pat=pastex("@rm_time2", "@rm_time"), extract=TRUE)
[[1]]
[1] "3:04 AM"

[[2]]
[1] "10:47 AM" "0:47 AM"

[[3]]
[1] NA

[[4]]
[1] "12:04"

[[5]]
[1] "12:04 a.m." "1:22 pm"
gsub,
stri_extract_all_regex
Other rm_.functions: rm_abbreviation;
rm_angle, rm_bracket,
rm_bracket_multiple,
rm_curly, rm_round,
rm_square; rm_between,
rm_between_multiple;
rm_caps_phrase; rm_caps;
rm_citation_tex; rm_citation;
rm_city_state_zip;
rm_city_state; rm_date;
rm_default; rm_dollar;
rm_email; rm_emoticon;
rm_endmark; rm_hash;
rm_nchar_words; rm_non_ascii;
rm_number; rm_percent;
rm_phone; rm_postal_code;
rm_repeated_characters;
rm_repeated_phrases;
rm_repeated_words; rm_tag;
rm_title_name;
rm_twitter_url, rm_url;
rm_white, rm_white_bracket,
rm_white_colon,
rm_white_comma,
rm_white_endmark,
rm_white_lead,
rm_white_lead_trail,
rm_white_multiple,
rm_white_punctuation,
rm_white_trail; rm_zip