May 7, 2025 · May 7, 2025 · May 11, 2025 · May 11, 2025 · May 11, 2025 · May 12, 2025
diff --git a/Doc/library/re.rst b/Doc/library/re.rst
   if match:
       process(match)

 Match objects are proper :class:`~collections.abc.Sequence` types. You can access
 match groups via subscripting ``match[...]`` and use familiar
 :class:`~collections.abc.Sequence` idioms to iterate over and extract match groups::

   >>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
   >>> m[1]
   'Isaac'
   >>> list(m)
   ['Isaac Newton', 'Isaac', 'Newton']
   >>> _, first_name, last_name = m
   >>> last_name
   'Newton'

 You can also destructure match objects with Python's ``match`` statement::

   >>> match re.match(r"(\d+)-(\d+)-(\d+)", "2000-10-16"):
   ...     case [_, year, month, day]:
   ...         year
   ...
   '2000'

 .. class:: Match

   Match object returned by successful ``match``\ es and ``search``\ es.

   .. versionadded:: 3.6

   .. versionchanged:: next

      Negative indexing is now supported. This allows accessing match groups
      from the end, starting from the last group defined in the pattern::

         >>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
         >>> m[-1]      # The first parenthesized subgroup starting from the end.
         'Newton'
         >>> m[-2]      # The second parenthesized subgroup starting from the end.
         'Isaac'
         >>> m[-3]      # The entire match starting from the end.
         'Isaac Newton'

      You can also use slicing to extract multiple groups as a tuple::

         >>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
         >>> m[1:]
         ('Isaac', 'Newton')


 .. method:: Match.__len__()

   Returns the number of groups accessible through the subscript syntax provided by
   :meth:`~Match.__getitem__`. This includes group ``0`` representing the entire match::

      >>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
      >>> len(m)
      3

   .. versionadded:: next


 .. method:: Match.groups(default=None)

   *group* defaults to zero, the entire match.


 .. method:: Match.index(value, start=0, stop=sys.maxsize, /)

   Return the index of the first occurrence of the value among the matched groups.

   Raises :exc:`ValueError` if the value is not present.

   .. versionadded:: next


 .. method:: Match.count(value, /)

   Return the number of occurrences of the value among the matched groups.

   .. versionadded:: next


 .. attribute:: Match.pos

   The value of *pos* which was passed to the :meth:`~Pattern.search` or
diff --git a/Lib/re/__init__.py b/Lib/re/__init__.py
 import enum
 from . import _compiler, _parser
 import functools
 import _collections_abc
 import _sre


 # Concrete types of compiled pattern objects and of match objects, obtained
 # by compiling an empty pattern and matching it against an empty string.
 Pattern = type(_compiler.compile('', 0))
 Match = type(_compiler.compile('', 0).match(''))

 # Register Match as a virtual subclass of the Sequence ABC so that
 # isinstance(m, Sequence) and issubclass(Match, Sequence) are true.
 _collections_abc.Sequence.register(Match)

 # --------------------------------------------------------------------
 # internals

diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py
                          cpython_only, captured_stdout,
                          check_disallow_instantiation, linked_to_musl,
                          warnings_helper, SHORT_TIMEOUT, Stopwatch, requires_resource)
 import itertools
 import locale
 import re
 import string
 import sys
 import unittest
 import warnings
 from collections.abc import Sequence
 from re import Scanner
 from weakref import proxy

        self.assertEqual(m[1], 'a')
        self.assertEqual(m[2], None)
        self.assertEqual(m[3], None)
        self.assertEqual(m[-1], None)
        self.assertEqual(m[-2], None)
        self.assertEqual(m[-3], 'a')
        self.assertEqual(m[-4], 'a')
        with self.assertRaisesRegex(IndexError, 'no such group'):
            m['X']
        with self.assertRaisesRegex(IndexError, 'no such group'):
            m[-1]
            m[-5]
        with self.assertRaisesRegex(IndexError, 'no such group'):
            m[4]
        with self.assertRaisesRegex(IndexError, 'no such group'):
        self.assertEqual(m[1], 'a')
        self.assertEqual(m[2], None)
        self.assertEqual(m[3], 'c')
        self.assertEqual(m[-1], 'c')
        self.assertEqual(m[-2], None)
        self.assertEqual(m[-3], 'a')
        self.assertEqual(m[-4], 'ac')

        # Cannot assign.
        with self.assertRaises(TypeError):
            m[0] = 1

        # No len().
        self.assertRaises(TypeError, len, m)
    def test_match_getitem_slice(self):
        # Slicing a match object must give the same result as slicing the
        # equivalent tuple of groups, for every start/end/step combination.
        groups = ("abc", "a", "b", "c")
        mo = re.match(r"(a)(b)(c)", "abc")
        bounds = [None, *range(-len(groups), len(groups) + 1)]
        # A slice step of zero is invalid, so it is left out of the candidates.
        steps = [candidate for candidate in bounds if candidate != 0]
        for start, end, step in itertools.product(bounds, bounds, steps):
            with self.subTest(start=start, end=end, step=step):
                expected = groups[start:end:step]
                self.assertEqual(mo[start:end:step], expected)

    def test_match_sequence(self):
        # Match objects must support the generic Sequence operations.
        mo = re.match(r"(a)(b)(c)", "abc")
        self.assertIsInstance(mo, Sequence)
        self.assertEqual(len(mo), 4)

        # Conversion to concrete sequence types.
        self.assertEqual(tuple(mo), ("abc", "a", "b", "c"))
        self.assertEqual(list(mo), ["abc", "a", "b", "c"])

        # Iterable unpacking.
        whole, first, second, third = mo
        self.assertEqual(whole, "abc")
        self.assertEqual(first, "a")
        self.assertEqual(second, "b")
        self.assertEqual(third, "c")

        # Membership tests.
        for group in ("abc", "a", "b", "c"):
            self.assertIn(group, mo)
        self.assertNotIn("123", mo)

        # Reverse iteration.
        self.assertEqual(list(reversed(mo)), ["c", "b", "a", "abc"])

        # Unpacking each match directly in the target of a for loop.
        for whole, key, value in re.finditer(r"(\w+):(\w+)", "abc:123"):
            self.assertEqual(whole, "abc:123")
            self.assertEqual(key, "abc")
            self.assertEqual(value, "123")

    def test_match_iter(self):
        # Iterating a match yields group 0, then each subgroup in order, and
        # is exhausted afterwards.
        groups_iter = iter(re.match(r"(a)(b)(c)", "abc"))
        for expected in ("abc", "a", "b", "c"):
            self.assertEqual(next(groups_iter), expected)
        with self.assertRaises(StopIteration):
            next(groups_iter)

    def test_match_index(self):
        # The pattern captures "b" twice (groups 2 and 4) so that the start
        # and stop arguments can select between the two occurrences.
        mo = re.match(r"(a)(b)(c)(b)", "abcb")

        def found(expected, *args):
            # mo.index(*args) must return the expected group index.
            self.assertEqual(mo.index(*args), expected)

        def missing(*args):
            # mo.index(*args) must report the value as absent.
            with self.assertRaises(ValueError):
                mo.index(*args)

        found(0, "abcb")
        found(1, "a")
        found(2, "b")
        found(3, "c")
        missing("123")

        # With start index.
        found(1, "a", 1)
        found(2, "b", 1)
        found(3, "c", 1)
        missing("abcb", 1)
        missing("123", 1)

        found(2, "b", 2)
        found(3, "c", 2)
        missing("abcb", 2)
        missing("a", 2)
        missing("123", 2)

        found(4, "b", 3)
        found(3, "c", 3)
        missing("abcb", 3)
        missing("a", 3)
        missing("123", 3)

        found(4, "b", 4)
        missing("abcb", 4)
        missing("a", 4)
        missing("c", 4)
        missing("123", 4)

        missing("abcb", 5)
        missing("a", 5)
        missing("b", 5)
        missing("c", 5)
        missing("123", 5)

        # With start index and stop index.
        found(2, "b", 1, 3)
        found(2, "b", 2, 4)
        found(4, "b", 3, 5)
        missing("b", 0, 2)
        missing("b", 3, 4)
        missing("b", -1, 0)

        # Non-string objects.
        missing(123)
        missing([1, 2, 3])
        missing(object())

    def test_match_count(self):
        # Match.count() must return the number of groups equal to the value:
        # one for each distinct group, zero for absent values.
        m = re.match(r"(a)(b)(c)", "abc")
        self.assertEqual(m.count("abc"), 1)
        self.assertEqual(m.count("a"), 1)
        self.assertEqual(m.count("b"), 1)
        self.assertEqual(m.count("c"), 1)
        self.assertEqual(m.count("123"), 0)

        # Non-string objects.
        self.assertEqual(m.count(123), 0)
        self.assertEqual(m.count([1, 2, 3]), 0)
        self.assertEqual(m.count(object()), 0)

        # A value captured by several groups is counted once per group.
        # Without this case every expected count is 0 or 1, so an
        # implementation that only tested membership would pass.
        m = re.match(r"(a)(b)(c)(b)", "abcb")
        self.assertEqual(m.count("b"), 2)
        self.assertEqual(m.count("abcb"), 1)
        self.assertEqual(m.count("a"), 1)

    def test_match_match_case(self):
        m = re.match(r"(a)(b)(c)", "abc")

        match m:
            case [abc, "a", "b", "c"]:
                self.assertEqual(abc, "abc")
            case _:
                self.fail()

        match re.match(r"(\d+)-(\d+)-(\d+)", "2025-05-07"):
            case [date, year, month, day]:
                self.assertEqual(date, "2025-05-07")
                self.assertEqual(year, "2025")
                self.assertEqual(month, "05")
                self.assertEqual(day, "07")
            case _:
                self.fail()

    def test_re_fullmatch(self):
        # Issue 16203: Proposal: add re.fullmatch() method.
diff --git a/Misc/ACKS b/Misc/ACKS
 Ezra Berch
 Stuart Berg
 Michel Van den Bergh
 Valentin Berlier
 Julian Berman
 Brice Berna
 Olivier Bernard
diff --git a/Misc/NEWS.d/next/Library/2025-05-12-02-49-18.gh-issue-133546.Gk0Qct.rst b/Misc/NEWS.d/next/Library/2025-05-12-02-49-18.gh-issue-133546.Gk0Qct.rst
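 Make :class:`re.Match` a proper :class:`~collections.abc.Sequence` type: match
 objects now support :func:`len`, iteration, negative indexing and slicing, and
 gain :meth:`~re.Match.index` and :meth:`~re.Match.count` methods.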
diff --git a/Modules/_sre/clinic/sre.c.h b/Modules/_sre/clinic/sre.c.h
Original file line number	Diff line number	Diff line change
Expand Up		@@ -1378,6 +1378,27 @@ when there is no match, you can test whether there was a match with a simple
		if match:
		process(match)

		Match objects are proper :class:`~collections.abc.Sequence` types. You can access
Copy link Member JelleZijlstraMay 7, 2025 Choose a reason for hiding this comment The reason will be displayed to describe this comment to others.Learn more. This is not true with this PR, Sequence has a number of other requirements (e.g. an`index` and`count` method). Copy link ContributorAuthor vberlierMay 7, 2025 Choose a reason for hiding this comment The reason will be displayed to describe this comment to others.Learn more. Nice catch, thanks! I added`index` and`count` by adapting the implementation of`tuple.index` and`tuple.count`. I also updated the unit test to cover all`Sequence` mixin methods.
		match groups via subscripting ``match[...]`` and use familiar
		:class:`~collections.abc.Sequence` idioms to iterate over and extract match groups::

		>>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
		>>> m[1]
		'Isaac'
		>>> list(m)
		['Isaac Newton', 'Isaac', 'Newton']
		>>> _, first_name, last_name = m
		>>> last_name
		'Newton'

		You can also destructure match objects with Python's ``match`` statement::

		>>> match re.match(r"(\d+)-(\d+)-(\d+)", "2000-10-16"):
		... case [_, year, month, day]:
		... year
		...
		'2000'

		.. class:: Match

		Match object returned by successful ``match``\ es and ``search``\ es.
Expand DownExpand Up		@@ -1473,6 +1494,37 @@ when there is no match, you can test whether there was a match with a simple

		.. versionadded:: 3.6

		.. versionchanged:: next

		Negative indexing is now supported. This allows accessing match groups
		from the end, starting from the last group defined in the pattern::

		>>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
		>>> m[-1] # The first parenthesized subgroup starting from the end.
		'Newton'
		>>> m[-2] # The second parenthesized subgroup starting from the end.
		'Isaac'
		>>> m[-3] # The entire match starting from the end.
		'Isaac Newton'

		You can also use slicing to extract multiple groups as a tuple::

		>>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
		>>> m[1:]
		('Isaac', 'Newton')


		.. method:: Match.__len__()

		Returns the number of groups accessible through the subscript syntax provided by
		:meth:`~Match.__getitem__`. This includes group ``0`` representing the entire match::

		>>> m = re.match(r"(\w+) (\w+)", "Isaac Newton, physicist")
		>>> len(m)
		3

		.. versionadded:: next


		.. method:: Match.groups(default=None)

Expand DownExpand Up		@@ -1539,6 +1591,22 @@ when there is no match, you can test whether there was a match with a simple
		group defaults to zero, the entire match.


		.. method:: Match.index(value, start=0, stop=sys.maxsize, /)
picnixz marked this conversation as resolved. Show resolvedHide resolved

		Return the index of the first occurrence of the value among the matched groups.

		Raises :exc:`ValueError` if the value is not present.

		.. versionadded:: next


		.. method:: Match.count(value, /)

		Return the number of occurrences of the value among the matched groups.

		.. versionadded:: next


		.. attribute:: Match.pos

		The value of pos which was passed to the :meth:`~Pattern.search` or
Expand Down
Original file line number	Diff line number	Diff line change
Expand Up		@@ -125,6 +125,7 @@
		import enum
		from . import _compiler, _parser
		import functools
		import _collections_abc
		import _sre


Expand DownExpand Up		@@ -315,6 +316,8 @@ def escape(pattern):
		Pattern = type(_compiler.compile('', 0))
		Match = type(_compiler.compile('', 0).match(''))

		_collections_abc.Sequence.register(Match)

		# --------------------------------------------------------------------
		# internals

Expand Down
Original file line number	Diff line number	Diff line change
Expand Up		@@ -2,12 +2,14 @@
		cpython_only, captured_stdout,
		check_disallow_instantiation, linked_to_musl,
		warnings_helper, SHORT_TIMEOUT, Stopwatch, requires_resource)
		import itertools
		import locale
		import re
		import string
		import sys
		import unittest
		import warnings
		from collections.abc import Sequence
		from re import Scanner
		from weakref import proxy

Expand DownExpand Up		@@ -570,10 +572,14 @@ def test_match_getitem(self):
		self.assertEqual(m[1], 'a')
		self.assertEqual(m[2], None)
		self.assertEqual(m[3], None)
		self.assertEqual(m[-1], None)
		self.assertEqual(m[-2], None)
		self.assertEqual(m[-3], 'a')
		self.assertEqual(m[-4], 'a')
		with self.assertRaisesRegex(IndexError, 'no such group'):
		m['X']
		with self.assertRaisesRegex(IndexError, 'no such group'):
		m[-1]
		m[-5]
		with self.assertRaisesRegex(IndexError, 'no such group'):
		m[4]
		with self.assertRaisesRegex(IndexError, 'no such group'):
Expand All		@@ -594,13 +600,144 @@ def test_match_getitem(self):
		self.assertEqual(m[1], 'a')
		self.assertEqual(m[2], None)
		self.assertEqual(m[3], 'c')
		self.assertEqual(m[-1], 'c')
		self.assertEqual(m[-2], None)
		self.assertEqual(m[-3], 'a')
		self.assertEqual(m[-4], 'ac')

		# Cannot assign.
		with self.assertRaises(TypeError):
		m[0] = 1

		# No len().
		self.assertRaises(TypeError, len, m)
		def test_match_getitem_slice(self):
		m = re.match(r"(a)(b)(c)", "abc")
picnixz marked this conversation as resolved. Show resolvedHide resolved
		seq = ("abc", "a", "b", "c")
		indices = [None, *range(-len(seq), len(seq) + 1)]
		for start, end, step in itertools.product(
		indices,
		indices,
		filter(lambda x: x != 0, indices), # slice step cannot be zero
		):
		with self.subTest(start=start, end=end, step=step):
		self.assertEqual(m[start:end:step], seq[start:end:step])

		def test_match_sequence(self):
		m = re.match(r"(a)(b)(c)", "abc")
		self.assertIsInstance(m, Sequence)
		self.assertEqual(len(m), 4)

		self.assertEqual(tuple(m), ("abc", "a", "b", "c"))
		self.assertEqual(list(m), ["abc", "a", "b", "c"])

		abc, a, b, c = m
		self.assertEqual(abc, "abc")
		self.assertEqual(a, "a")
		self.assertEqual(b, "b")
		self.assertEqual(c, "c")

		self.assertIn("abc", m)
		self.assertIn("a", m)
		self.assertIn("b", m)
		self.assertIn("c", m)
		self.assertNotIn("123", m)

		self.assertEqual(list(reversed(m)), ["c", "b", "a", "abc"])

		for s, k, v in re.finditer(r"(\w+):(\w+)", "abc:123"):
		self.assertEqual(s, "abc:123")
		self.assertEqual(k, "abc")
		self.assertEqual(v, "123")

		def test_match_iter(self):
		it = iter(re.match(r"(a)(b)(c)", "abc"))
		self.assertEqual(next(it), "abc")
		self.assertEqual(next(it), "a")
		self.assertEqual(next(it), "b")
		self.assertEqual(next(it), "c")
		self.assertRaises(StopIteration, next, it)

		def test_match_index(self):
		m = re.match(r"(a)(b)(c)(b)", "abcb")
		self.assertEqual(m.index("abcb"), 0)
		self.assertEqual(m.index("a"), 1)
		self.assertEqual(m.index("b"), 2)
picnixz marked this conversation as resolved. Show resolvedHide resolved
		self.assertEqual(m.index("c"), 3)
		self.assertRaises(ValueError, m.index, "123")

		# With start index.
		self.assertEqual(m.index("a", 1), 1)
		self.assertEqual(m.index("b", 1), 2)
		self.assertEqual(m.index("c", 1), 3)
		self.assertRaises(ValueError, m.index, "abcb", 1)
		self.assertRaises(ValueError, m.index, "123", 1)

		self.assertEqual(m.index("b", 2), 2)
		self.assertEqual(m.index("c", 2), 3)
		self.assertRaises(ValueError, m.index, "abcb", 2)
		self.assertRaises(ValueError, m.index, "a", 2)
		self.assertRaises(ValueError, m.index, "123", 2)

		self.assertEqual(m.index("b", 3), 4)
		self.assertEqual(m.index("c", 3), 3)
		self.assertRaises(ValueError, m.index, "abcb", 3)
		self.assertRaises(ValueError, m.index, "a", 3)
		self.assertRaises(ValueError, m.index, "123", 3)

		self.assertEqual(m.index("b", 4), 4)
		self.assertRaises(ValueError, m.index, "abcb", 4)
		self.assertRaises(ValueError, m.index, "a", 4)
		self.assertRaises(ValueError, m.index, "c", 4)
		self.assertRaises(ValueError, m.index, "123", 4)

		self.assertRaises(ValueError, m.index, "abcb", 5)
		self.assertRaises(ValueError, m.index, "a", 5)
		self.assertRaises(ValueError, m.index, "b", 5)
		self.assertRaises(ValueError, m.index, "c", 5)
		self.assertRaises(ValueError, m.index, "123", 5)

		# With start index and stop index.
		self.assertEqual(m.index("b", 1, 3), 2)
		self.assertEqual(m.index("b", 2, 4), 2)
		self.assertEqual(m.index("b", 3, 5), 4)
		self.assertRaises(ValueError, m.index, "b", 0, 2)
		self.assertRaises(ValueError, m.index, "b", 3, 4)
		self.assertRaises(ValueError, m.index, "b", -1, 0)

		# Non-string objects.
		self.assertRaises(ValueError, m.index, 123)
		self.assertRaises(ValueError, m.index, [1, 2, 3])
		self.assertRaises(ValueError, m.index, object())

		def test_match_count(self):
		m = re.match(r"(a)(b)(c)", "abc")
		self.assertEqual(m.count("abc"), 1)
		self.assertEqual(m.count("a"), 1)
		self.assertEqual(m.count("b"), 1)
		self.assertEqual(m.count("c"), 1)
		self.assertEqual(m.count("123"), 0)
picnixz marked this conversation as resolved. Show resolvedHide resolved

		# Non-string objects.
		self.assertEqual(m.count(123), 0)
		self.assertEqual(m.count([1, 2, 3]), 0)
		self.assertEqual(m.count(object()), 0)

		def test_match_match_case(self):
		m = re.match(r"(a)(b)(c)", "abc")

		match m:
		case [abc, "a", "b", "c"]:
		self.assertEqual(abc, "abc")
		case _:
		self.fail()

		match re.match(r"(\d+)-(\d+)-(\d+)", "2025-05-07"):
		case [date, year, month, day]:
		self.assertEqual(date, "2025-05-07")
		self.assertEqual(year, "2025")
		self.assertEqual(month, "05")
		self.assertEqual(day, "07")
		case _:
		self.fail()

picnixz marked this conversation as resolved. Show resolvedHide resolved
		def test_re_fullmatch(self):
		# Issue 16203: Proposal: add re.fullmatch() method.
Expand Down
Original file line number	Diff line number	Diff line change
Expand Up		@@ -157,6 +157,7 @@ Bennett Benson
		Ezra Berch
		Stuart Berg
		Michel Van den Bergh
		Valentin Berlier
		Julian Berman
		Brice Berna
		Olivier Bernard
Expand Down
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
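		Make :class:`re.Match` a proper :class:`~collections.abc.Sequence` type: match
		objects now support :func:`len`, iteration, negative indexing and slicing, and
		gain :meth:`~re.Match.index` and :meth:`~re.Match.count` methods.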