@@ -226,18 +226,13 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
{
if (__icase)
return _M_traits.translate_nocase(__ch);
- else if (__collate)
- return _M_traits.translate(__ch);
else
- return __ch;
+ return _M_traits.translate(__ch);
}
_StrTransT
_M_transform(_CharT __ch) const
- {
- return _M_transform_impl(__ch, typename integral_constant<bool,
- __collate>::type());
- }
+ { return _M_transform_impl(__ch, __bool_constant<__collate>()); }
private:
_StrTransT
@@ -247,7 +242,7 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
_StrTransT
_M_transform_impl(_CharT __ch, true_type) const
{
- _StrTransT __str = _StrTransT(1, _M_translate(__ch));
+ _StrTransT __str = _StrTransT(1, __ch);
return _M_traits.transform(__str.begin(), __str.end());
}
@@ -433,6 +428,8 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
void
_M_make_range(_CharT __l, _CharT __r)
{
+ __l = _M_translator._M_translate(__l);
+ __r = _M_translator._M_translate(__r);
if (__l > __r)
__throw_regex_error(regex_constants::error_range,
"Invalid range in bracket expression.");
@@ -428,11 +428,13 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
if (!(_M_flags & regex_constants::ECMAScript))
if (_M_try_char())
{
- __matcher._M_add_char(_M_value[0]);
__last_char.first = true;
__last_char.second = _M_value[0];
}
while (_M_expression_term(__last_char, __matcher));
+ if (__last_char.first)
+ __matcher._M_add_char(__last_char.second);
+
__matcher._M_ready();
_M_stack.push(_StateSeqT(
*_M_nfa,
@@ -449,8 +451,17 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
if (_M_match_token(_ScannerT::_S_token_bracket_end))
return false;
+ const auto __flush = [&]
+ {
+ if (__last_char.first)
+ {
+ __matcher._M_add_char(__last_char.second);
+ __last_char.first = false;
+ }
+ };
if (_M_match_token(_ScannerT::_S_token_collsymbol))
{
+ __flush();
auto __symbol = __matcher._M_add_collate_element(_M_value);
if (__symbol.size() == 1)
{
@@ -459,9 +470,15 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
}
}
else if (_M_match_token(_ScannerT::_S_token_equiv_class_name))
- __matcher._M_add_equivalence_class(_M_value);
+ {
+ __flush();
+ __matcher._M_add_equivalence_class(_M_value);
+ }
else if (_M_match_token(_ScannerT::_S_token_char_class_name))
- __matcher._M_add_character_class(_M_value, false);
+ {
+ __flush();
+ __matcher._M_add_character_class(_M_value, false);
+ }
// POSIX doesn't allow '-' as a start-range char (say [a-z--0]),
// except when the '-' is the first or last character in the bracket
// expression ([--0]). ECMAScript treats all '-' after a range as a
@@ -476,7 +493,8 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
{
if (!__last_char.first)
{
- __matcher._M_add_char(_M_value[0]);
+ __last_char.first = true;
+ __last_char.second = _M_value[0];
if (_M_value[0] == '-'
&& !(_M_flags & regex_constants::ECMAScript))
{
@@ -488,8 +506,6 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
"a dash is not treated literally only when it is at "
"beginning or end.");
}
- __last_char.first = true;
- __last_char.second = _M_value[0];
}
else
{
@@ -499,22 +515,16 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
{
__matcher._M_make_range(__last_char.second , _M_value[0]);
__last_char.first = false;
+ return true;
}
- else
- {
- if (_M_scanner._M_get_token()
- != _ScannerT::_S_token_bracket_end)
- __throw_regex_error(
- regex_constants::error_range,
- "Unexpected end of bracket expression.");
- __matcher._M_add_char(_M_value[0]);
- }
- }
- else
- {
- __matcher._M_add_char(_M_value[0]);
- __last_char.second = _M_value[0];
+ if (_M_scanner._M_get_token()
+ != _ScannerT::_S_token_bracket_end)
+ __throw_regex_error(
+ regex_constants::error_range,
+ "Unexpected end of bracket expression.");
}
+ __matcher._M_add_char(__last_char.second);
+ __last_char.second = _M_value[0];
}
}
else if (_M_match_token(_ScannerT::_S_token_quoted_class))
@@ -580,8 +590,9 @@ _GLIBCXX_BEGIN_NAMESPACE_VERSION
_BracketMatcher<_TraitsT, __icase, __collate>::
_M_apply(_CharT __ch, false_type) const
{
+ __ch = _M_translator._M_translate(__ch);
bool __ret = std::binary_search(_M_char_set.begin(), _M_char_set.end(),
- _M_translator._M_translate(__ch));
+ __ch);
if (!__ret)
{
auto __s = _M_translator._M_transform(__ch);
@@ -61,12 +61,40 @@ test03()
VERIFY(!regex_search_debug("a", regex(R"(\b$)"), regex_constants::match_not_eow));
}
+// PR libstdc++/71500
+void
+test04()
+{
+ bool test __attribute__((unused)) = true;
+
+ {
+ regex re1("[A-F]+", regex::ECMAScript | regex::icase);
+ VERIFY(regex_match_debug("aaa", re1));
+ VERIFY(regex_match_debug("AAA", re1));
+ VERIFY(regex_match_debug("fff", re1));
+ VERIFY(regex_match_debug("FFF", re1));
+ }
+ {
+ bool caught = false;
+ try
+ {
+ (void)regex("[T-f]+", regex::ECMAScript | regex::icase);
+ }
+ catch (...)
+ {
+ caught = true;
+ }
+ VERIFY(caught);
+ }
+}
+
int
main()
{
test01();
test02();
test03();
+ test04();
return 0;
}