suite_bytes.rs - Codebrowser

1	use {
2	anyhow::Result,
3	regex::bytes::{Regex, RegexBuilder},
4	regex_test::{
5	CompiledRegex, Match, RegexTest, Span, TestResult, TestRunner,
6	},
7	};
8
/// Runs the shared regex test suite against `regex::bytes::Regex` built
/// with its default configuration.
///
/// Every test that compiles is expanded into `is_match`, `find` and
/// `captures` variants, blacklisted tests are excluded, and each remaining
/// test is executed through `compiler`.
#[test]
fn default() -> Result<()> {
    let mut runner = TestRunner::new()?;
    runner
        .expand(&["is_match", "find", "captures"], |test| test.compiles())
        .blacklist_iter(super::BLACKLIST)
        .test_iter(crate::suite()?.iter(), compiler)
        .assert();
    Ok(())
}
20
21	fn run_test(re: &Regex, test: &RegexTest) -> TestResult {
22	match test.additional_name() {
23	"is_match" => TestResult::matched(re.is_match(test.haystack())),
24	"find" => TestResult::matches(
25	re.find_iter(test.haystack())
26	.take(test.match_limit().unwrap_or(std::usize::MAX))
27	.map(\|m\| Match {
28	id: `0`,
29	span: Span { start: m.start(), end: m.end() },
30	}),
31	),
32	"captures" => {
33	let it = re
34	.captures_iter(test.haystack())
35	.take(test.match_limit().unwrap_or(std::usize::MAX))
36	.map(\|caps\| testify_captures(&caps));
37	TestResult::captures(it)
38	}
39	name => TestResult::fail(&format!("unrecognized test name: {}", name)),
40	}
41	}
42
43	/// Converts the given regex test to a closure that searches with a
44	/// `bytes::Regex`. If the test configuration is unsupported, then a
45	/// `CompiledRegex` that skips the test is returned.
46	fn compiler(
47	test: &RegexTest,
48	_patterns: &[String],
49	) -> anyhow::Result<CompiledRegex> {
50	let skip = Ok(CompiledRegex::skip());
51
52	// We're only testing bytes::Regex here, which supports one pattern only.
53	let pattern = match test.regexes().len() {
54	`1` => &test.regexes()[`0`],
55	_ => return skip,
56	};
57	// We only test is_match, find_iter and captures_iter. All of those are
58	// leftmost searches.
59	if !matches!(test.search_kind(), regex_test::SearchKind::Leftmost) {
60	return skip;
61	}
62	// The top-level single-pattern regex API always uses leftmost-first.
63	if !matches!(test.match_kind(), regex_test::MatchKind::LeftmostFirst) {
64	return skip;
65	}
66	// The top-level regex API always runs unanchored searches. ... But we can
67	// handle tests that are anchored but have only one match.
68	if test.anchored() && test.match_limit() != Some(`1`) {
69	return skip;
70	}
71	// We don't support tests with explicit search bounds. We could probably
72	// support this by using the 'find_at' (and such) APIs.
73	let bounds = test.bounds();
74	if !(bounds.start == `0` && bounds.end == test.haystack().len()) {
75	return skip;
76	}
77	// The bytes::Regex API specifically does not support enabling UTF-8 mode.
78	// It could I suppose, but currently it does not. That is, it permits
79	// matches to have offsets that split codepoints.
80	if test.utf8() {
81	return skip;
82	}
83	// If the test requires Unicode but the Unicode feature isn't enabled,
84	// skip it. This is a little aggressive, but the test suite doesn't
85	// have any easy way of communicating which Unicode features are needed.
86	if test.unicode() && !cfg!(feature = "unicode") {
87	return skip;
88	}
89	let re = RegexBuilder::new(pattern)
90	.case_insensitive(test.case_insensitive())
91	.unicode(test.unicode())
92	.line_terminator(test.line_terminator())
93	.build()?;
94	Ok(CompiledRegex::compiled(move \|test\| run_test(&re, test)))
95	}
96
97	/// Convert `Captures` into the test suite's capture values.
98	fn testify_captures(
99	caps: &regex::bytes::Captures<'_>,
100	) -> regex_test::Captures {
101	let spans = caps.iter().map(\|group\| {
102	group.map(\|m\| regex_test::Span { start: m.start(), end: m.end() })
103	});
104	// This unwrap is OK because we assume our 'caps' represents a match, and
105	// a match always gives a non-zero number of groups with the first group
106	// being non-None.
107	regex_test::Captures::new(`0`, spans).unwrap()
108	}
109