242 lines
6.7 KiB
Rust
Raw Permalink Normal View History

2024-11-12 15:03:58 +03:00
#[test]
fn empty_regex_empty_match() {
    // An empty pattern over an empty haystack yields exactly one empty span.
    let pattern = regex!("");
    let found = findall!(pattern, "");
    let expected = vec![(0, 0)];
    assert_eq!(expected, found);
}
#[test]
fn empty_regex_nonempty_match() {
    // An empty pattern is expected to produce one empty span at every
    // position of "abc", including the position just past the last character.
    let pattern = regex!("");
    let found = findall!(pattern, "abc");
    let expected = vec![(0, 0), (1, 1), (2, 2), (3, 3)];
    assert_eq!(expected, found);
}
#[test]
fn one_zero_length_match() {
    // `\d*` may match nothing: the expectation is a single empty span before
    // the leading `a`, followed by one span per digit.
    let digits = regex!(r"\d*");
    let found = findall!(digits, "a1b2");
    let expected = vec![(0, 0), (1, 2), (3, 4)];
    assert_eq!(expected, found);
}
#[test]
fn many_zero_length_match() {
    // With a run of non-digits ("bbb"), several empty spans are expected in
    // addition to the two digit spans; note that no empty span is expected
    // at offset 2, directly after the first digit span.
    let digits = regex!(r"\d*");
    let found = findall!(digits, "a1bbb2");
    let expected = vec![(0, 0), (1, 2), (3, 3), (4, 4), (5, 6)];
    assert_eq!(expected, found);
}
#[test]
fn many_sequential_zero_length_match() {
    // `\d?` takes at most one digit, so the adjacent digits "12" are expected
    // as two back-to-back spans, with empty spans only at the very start and
    // the very end of the haystack.
    let optional_digit = regex!(r"\d?");
    let found = findall!(optional_digit, "a12b3c");
    let expected = vec![(0, 0), (1, 2), (2, 3), (4, 5), (6, 6)];
    assert_eq!(expected, found);
}
#[test]
fn quoted_bracket_set() {
    // Both spellings of a character class holding `[` and `]` must report
    // each bracket of "[]" as its own span.

    // Brackets written as hex escapes (0x5b is `[`, 0x5d is `]`).
    let hex_escaped = regex!(r"([\x{5b}\x{5d}])");
    let hex_found = findall!(hex_escaped, "[]");
    assert_eq!(vec![(0, 1), (1, 2)], hex_found);

    // Brackets written with backslash escapes.
    let backslash_escaped = regex!(r"([\[\]])");
    let backslash_found = findall!(backslash_escaped, "[]");
    assert_eq!(vec![(0, 1), (1, 2)], backslash_found);
}
#[test]
fn first_range_starts_with_left_bracket() {
    // The class opens with an unescaped `[` used as the low end of the range
    // `[`-`z`; both brackets of "[]" fall inside that range.
    let bracket_to_z = regex!(r"([[-z])");
    let found = findall!(bracket_to_z, "[]");
    let expected = vec![(0, 1), (1, 2)];
    assert_eq!(expected, found);
}
#[test]
fn range_ends_with_escape() {
    // The range runs from an escaped `[` up to a hex escape (0x5d is `]`),
    // so an escape sequence is used as the upper bound of a class range.
    let bracket_range = regex!(r"([\[-\x{5d}])");
    let found = findall!(bracket_range, "[]");
    let expected = vec![(0, 1), (1, 2)];
    assert_eq!(expected, found);
}
#[test]
fn empty_match_find_iter() {
    // The lazy `.*?` is expected to match the empty string at each position
    // of "abc", including the one past the end.
    let lazy_any = regex!(r".*?");
    let found = findall!(lazy_any, "abc");
    let expected = vec![(0, 0), (1, 1), (2, 2), (3, 3)];
    assert_eq!(expected, found);
}
#[test]
fn empty_match_captures_iter() {
    // Same expectation as the `find_iter`-based test for `.*?`, but gathered
    // through `captures_iter` by reading the position of group 0.
    let lazy_any = regex!(r".*?");
    let mut spans = Vec::new();
    for caps in lazy_any.captures_iter(text!("abc")) {
        // Group 0 is unwrapped unconditionally; a missing position panics.
        spans.push(caps.pos(0).unwrap());
    }
    assert_eq!(spans, vec![(0, 0), (1, 1), (2, 2), (3, 3)]);
}
#[test]
fn capture_names() {
    // One unnamed group plus one group named `a`; together with the implicit
    // whole-match group that makes three capture slots.
    let pattern = regex!(r"(.)(?P<a>.)");
    assert_eq!(3, pattern.captures_len());

    // The name iterator must report an exact size hint of three ...
    let hint = pattern.capture_names().size_hint();
    assert_eq!((3, Some(3)), hint);

    // ... and yield `None` for the unnamed slots and the name for `a`.
    let names: Vec<_> = pattern.capture_names().collect();
    assert_eq!(vec![None, None, Some("a")], names);
}
#[test]
fn regex_string() {
    // The original pattern text must come back unchanged from `as_str`,
    // from `Display` formatting and from `Debug` formatting.
    let expected = r"[a-zA-Z0-9]+";

    let via_as_str = regex!(r"[a-zA-Z0-9]+");
    assert_eq!(expected, via_as_str.as_str());

    let via_display = format!("{}", regex!(r"[a-zA-Z0-9]+"));
    assert_eq!(expected, &via_display);

    let via_debug = format!("{:?}", regex!(r"[a-zA-Z0-9]+"));
    assert_eq!(expected, &via_debug);
}
#[test]
fn capture_index() {
    // The single named group spans the whole input, so indexing by 0, by 1
    // and by the group name must all give back the full text.
    let pattern = regex!(r"^(?P<name>.+)$");
    let caps = pattern.captures(t!("abc")).unwrap();
    let whole = t!("abc");

    assert_eq!(&caps[0], whole);
    assert_eq!(&caps[1], whole);
    assert_eq!(&caps["name"], whole);
}
#[test]
#[should_panic]
#[cfg_attr(all(target_env = "msvc", target_pointer_width = "32"), ignore)]
fn capture_index_panic_usize() {
    // The pattern only has groups 0 and 1, so indexing with 2 must panic.
    let pattern = regex!(r"^(?P<name>.+)$");
    let caps = pattern.captures(t!("abc")).unwrap();
    let _ = caps[2];
}
#[test]
#[should_panic]
#[cfg_attr(all(target_env = "msvc", target_pointer_width = "32"), ignore)]
fn capture_index_panic_name() {
    // The only named group is `name`, so indexing with any other name must
    // panic.
    let pattern = regex!(r"^(?P<name>.+)$");
    let caps = pattern.captures(t!("abc")).unwrap();
    let _ = caps["bad name"];
}
#[test]
fn capture_index_lifetime() {
    // Compile-time check: indexing captures by name inside a helper that
    // borrows its input must typecheck. If the types involved in
    // `caps["..."]` were not general enough, this would not build.
    fn digits_len(haystack: &str) -> usize {
        let number = regex!(r"(?P<number>\d+)");
        let caps = number.captures(t!(haystack)).unwrap();
        caps["number"].len()
    }

    let len = digits_len("123");
    assert_eq!(3, len);
}
#[test]
fn capture_misc() {
    // Against "abc" the optional group `a` (index 2) does not take part in
    // the match, while group `b` (index 4) captures the final "c".
    let pattern = regex!(r"(.)(?P<a>a)?(.)(?P<b>.)");
    let caps = pattern.captures(t!("abc")).unwrap();

    // Whole match plus four explicit groups.
    assert_eq!(5, caps.len());

    // Lookup of positions by index.
    assert_eq!(Some((0, 3)), caps.pos(0));
    assert_eq!(None, caps.pos(2));
    assert_eq!(Some((2, 3)), caps.pos(4));

    // Lookup of matched text by index.
    assert_eq!(Some(t!("abc")), caps.at(0));
    assert_eq!(None, caps.at(2));
    assert_eq!(Some(t!("c")), caps.at(4));

    // Lookup of matched text by group name.
    assert_eq!(None, caps.name("a"));
    assert_eq!(Some(t!("c")), caps.name("b"));
}
#[test]
fn capture_iter() {
    // Every group takes part in the match, so iterating the captures yields
    // the whole match followed by one character per group, all `Some`.
    let pattern = regex!(r"(.)(?P<a>.)(.)(?P<b>.)");
    let caps = pattern.captures(t!("abcd")).unwrap();
    assert_eq!(5, caps.len());

    let expected = vec![
        Some(t!("abcd")),
        Some(t!("a")),
        Some(t!("b")),
        Some(t!("c")),
        Some(t!("d")),
    ];
    let got: Vec<_> = caps.iter().collect();
    assert_eq!(expected, got);
}
#[test]
fn capture_iter_missing() {
    // The optional group `a` does not take part in the match against "abc",
    // so its slot in the iteration must be `None`.
    let pattern = regex!(r"(.)(?P<a>a)?(.)(?P<b>.)");
    let caps = pattern.captures(t!("abc")).unwrap();
    assert_eq!(5, caps.len());

    let expected = vec![
        Some(t!("abc")),
        Some(t!("a")),
        None,
        Some(t!("b")),
        Some(t!("c")),
    ];
    let got: Vec<_> = caps.iter().collect();
    assert_eq!(expected, got);
}
#[test]
fn capture_iter_pos() {
    // Position iteration: the whole match first, then one single-character
    // span per group, all present.
    let pattern = regex!(r"(.)(?P<a>.)(.)(?P<b>.)");
    let caps = pattern.captures(t!("abcd")).unwrap();

    let expected = vec![
        Some((0, 4)),
        Some((0, 1)),
        Some((1, 2)),
        Some((2, 3)),
        Some((3, 4)),
    ];
    let got: Vec<_> = caps.iter_pos().collect();
    assert_eq!(expected, got);
}
#[test]
fn capture_iter_pos_missing() {
    // Position iteration where the optional group `a` is absent: its slot
    // must be `None` while the remaining groups keep their spans.
    let pattern = regex!(r"(.)(?P<a>a)?(.)(?P<b>.)");
    let caps = pattern.captures(t!("abc")).unwrap();

    let expected = vec![
        Some((0, 3)),
        Some((0, 1)),
        None,
        Some((1, 2)),
        Some((2, 3)),
    ];
    let got: Vec<_> = caps.iter_pos().collect();
    assert_eq!(expected, got);
}
#[test]
fn capture_iter_named() {
    // Named-group iteration must yield `a` and `b` with their text; either
    // ordering of the two entries is accepted.
    let pattern = regex!(r"(.)(?P<a>.)(.)(?P<b>.)");
    let caps = pattern.captures(t!("abcd")).unwrap();

    let a_then_b = vec![("a", Some(t!("b"))), ("b", Some(t!("d")))];
    let b_then_a = vec![("b", Some(t!("d"))), ("a", Some(t!("b")))];

    let got: Vec<_> = caps.iter_named().collect();
    let matches_forward = got == a_then_b;
    let matches_reverse = got == b_then_a;
    assert!(matches_forward || matches_reverse);
}
#[test]
fn capture_iter_named_missing() {
    // Named-group iteration where the optional group `a` is expected to be
    // absent: it must still be listed, paired with `None`. Either ordering
    // of the two entries is accepted.
    let pattern = regex!(r"(.)(?P<a>.)?(.)(?P<b>.)");
    let caps = pattern.captures(t!("abc")).unwrap();

    let a_then_b = vec![("a", None), ("b", Some(t!("c")))];
    let b_then_a = vec![("b", Some(t!("c"))), ("a", None)];

    let got: Vec<_> = caps.iter_named().collect();
    let matches_forward = got == a_then_b;
    let matches_reverse = got == b_then_a;
    assert!(matches_forward || matches_reverse);
}
// Replacement-template cases. Each `expand!` line supplies, in order: a case
// name, a pattern, an input text, a replacement template and the expected
// result.
// NOTE(review): `expand!` is defined outside this section; presumably it
// generates one test per invocation — confirm against its definition.

// A group can be referenced by name (`$foo`) or by index (`$0`, `$1`).
expand!(expand1, r"(?P<foo>\w+)", "abc", "$foo", "abc");
expand!(expand2, r"(?P<foo>\w+)", "abc", "$0", "abc");
expand!(expand3, r"(?P<foo>\w+)", "abc", "$1", "abc");
// `$$` is expected to produce a literal `$` rather than a group reference.
expand!(expand4, r"(?P<foo>\w+)", "abc", "$$1", "$1");
expand!(expand5, r"(?P<foo>\w+)", "abc", "$$foo", "$foo");
// Two adjacent references are expanded independently.
expand!(expand6, r"(?P<a>\w+)\s+(?P<b>\d+)",
"abc 123", "$b$a", "123abc");
// Here `$bz` and `$az` contribute nothing to the expected output.
// NOTE(review): presumably the names are read as `bz`/`az`, which are not
// groups in the pattern — confirm against the expansion rules.
expand!(expand7, r"(?P<a>\w+)\s+(?P<b>\d+)",
"abc 123", "z$bz$az", "z");
// Non-word separators (`.` or a space) end the reference name, so `$b` and
// `$a` are expanded and the separators are kept.
expand!(expand8, r"(?P<a>\w+)\s+(?P<b>\d+)",
"abc 123", ".$b.$a.", ".123.abc.");
expand!(expand9, r"(?P<a>\w+)\s+(?P<b>\d+)",
"abc 123", " $b $a ", " 123 abc ");
// Same situation as `expand7` without the leading literal: expected output
// is empty.
expand!(expand10, r"(?P<a>\w+)\s+(?P<b>\d+)",
"abc 123", "$bz$az", "");
// Splitting cases. Each `split!` line supplies, in order: a case name, a
// pattern, an input text and the expected pieces.
// NOTE(review): `split!` is defined outside this section; presumably it
// generates one test per invocation — confirm against its definition.

// Runs of mixed whitespace (spaces, newlines, tabs) act as one separator.
split!(split1, r"\s+", "a b\nc\td\n\t e",
&[t!("a"), t!("b"), t!("c"), t!("d"), t!("e")]);
// Splitting on the zero-width `\b`: the expected pieces start with an empty
// string and keep the single spaces as their own pieces.
split!(split2, r"\b", "a b c",
&[t!(""), t!("a"), t!(" "), t!("b"), t!(" "), t!("c")]);