Skip to content

Commit 217e7e3

Browse files
authored
Clarify the use of DOTALL in JSON Schema regular expressions (#1586)
Signed-off-by: Juan Cruz Viotti <[email protected]>
1 parent ed6fb35 commit 217e7e3

File tree

2 files changed

+27
-1
lines changed

2 files changed

+27
-1
lines changed

src/core/regex/include/sourcemeta/core/regex.h

+8-1
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
#include <variant> // std::variant
2828

2929
/// @defgroup regex Regex
30-
/// @brief A regex ECMA implementation for JSON Schema
30+
/// @brief An opinionated regex ECMA 262 implementation for JSON Schema
3131
///
3232
/// This functionality is included as follows:
3333
///
@@ -95,6 +95,10 @@ auto to_regex(const T &pattern) -> std::optional<Regex<T>> {
9595
if (pattern == ".*" || pattern == "^.*$" || pattern == "^(.*)$" ||
9696
pattern == "(.*)" || pattern == "[\\s\\S]*" || pattern == "^[\\s\\S]*$") {
9797
return RegexTypeNoop{};
98+
99+
// Note that the JSON Schema specification does not impose the use of any
100+
// regular expression flag. Given popular adoption, we assume `.` matches
101+
// new line characters (as in the `DOTALL`) option
98102
} else if (pattern == ".+" || pattern == "^.+$" || pattern == "^(.+)$" ||
99103
pattern == ".") {
100104
return RegexTypeNonEmpty{};
@@ -125,6 +129,9 @@ auto to_regex(const T &pattern) -> std::optional<Regex<T>> {
125129
// treated as non-marking sub-expressions (?:expr)
126130
boost::regex::nosubs |
127131

132+
// Make the `.` character class match new lines
133+
boost::regex::mod_s |
134+
128135
// Instructs the regular expression engine to make matching faster,
129136
// with the potential cost of making construction slower
130137
boost::regex::optimize};

test/regex/regex_matches_test.cc

+19
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,25 @@ TEST(Regex_matches, match_true_14) {
9393
"@namespace/mypackage"));
9494
}
9595

96+
TEST(Regex_matches, match_true_15) {
97+
const auto regex{sourcemeta::core::to_regex<std::string>(".")};
98+
EXPECT_TRUE(regex.has_value());
99+
EXPECT_TRUE(sourcemeta::core::matches<std::string>(regex.value(), "\n"));
100+
}
101+
102+
TEST(Regex_matches, match_true_16) {
103+
const auto regex{sourcemeta::core::to_regex<std::string>(".")};
104+
EXPECT_TRUE(regex.has_value());
105+
EXPECT_TRUE(sourcemeta::core::matches<std::string>(regex.value(), "\r"));
106+
}
107+
108+
TEST(Regex_matches, match_true_17) {
109+
const auto regex{sourcemeta::core::to_regex<std::string>("^.+$")};
110+
EXPECT_TRUE(regex.has_value());
111+
EXPECT_TRUE(
112+
sourcemeta::core::matches<std::string>(regex.value(), "foo\nbar\r"));
113+
}
114+
96115
TEST(Regex_matches, match_false_1) {
97116
const auto regex{sourcemeta::core::to_regex<std::string>("^foo")};
98117
EXPECT_TRUE(regex.has_value());

0 commit comments

Comments
 (0)