The rain ' @@ -618,8 +608,6 @@ def test_convert_charrefs_dropped_text(self): class AttributesTestCase(TestCaseBase): - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_attr_syntax(self): output = [ ("starttag", "a", [("b", "v"), ("c", "v"), ("d", "v"), ("e", None)]) @@ -629,8 +617,6 @@ def test_attr_syntax(self): self._run_check("""""", output) self._run_check("""""", output) - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_attr_values(self): self._run_check("""""", [("starttag", "a", [("b", "xxx\n\txxx"), @@ -646,8 +632,6 @@ def test_attr_values(self): "", [("starttag", "a", [("href", "mailto:xyz@example.com")])]) - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_attr_nonascii(self): # see issue 7311 self._run_check( @@ -668,8 +652,6 @@ def test_attr_entity_replacement(self): "", [("starttag", "a", [("b", "&><\"'")])]) - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_attr_funky_names(self): self._run_check( "", @@ -718,8 +700,6 @@ def test_malformed_attributes(self): ] self._run_check(html, expected) - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_malformed_adjacent_attributes(self): # see #12629 self._run_check('', @@ -732,8 +712,6 @@ def test_malformed_adjacent_attributes(self): ('endtag', 'x')]) # see #755670 for the following 3 tests - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_adjacent_attributes(self): self._run_check('', [("starttag", "a", @@ -759,8 +737,6 @@ def test_end_tag_in_attribute_value(self): [("href", "http://www.example.org/\">;")]), ("data", "spam"), ("endtag", "a")]) - # TODO: RUSTPYTHON - @unittest.expectedFailure def test_with_unquoted_attributes(self): # see #12008 html = ("" diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py index 62bfc3a7aa..03cb8172de 100644 --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -54,6 +54,8 @@ def checkTemplateError(self, pattern, repl, string, errmsg, pos=None): if pos is not None: self.assertEqual(err.pos, pos) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_keep_buffer(self): # See bug 14212 b = bytearray(b'x') @@ -555,6 +557,8 @@ def test_re_groupref_exists(self): pat = '(?:%s)(?(200)z)' % pat self.assertEqual(re.match(pat, 'xc8yz').span(), (0, 5)) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_re_groupref_exists_errors(self): self.checkPatternError(r'(?P )(?(0)a|b)', 'bad group number', 10) self.checkPatternError(r'()(?(-1)a|b)', @@ -650,6 +654,8 @@ def test_repeat_minmax(self): self.checkPatternError(r'x{2,1}', 'min repeat greater than max repeat', 2) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_getattr(self): self.assertEqual(re.compile("(?i)(a)(b)").pattern, "(?i)(a)(b)") self.assertEqual(re.compile("(?i)(a)(b)").flags, re.I | re.U) @@ -723,6 +729,8 @@ def test_other_escapes(self): with self.subTest(c): self.assertRaises(re.error, re.compile, '[\\%c]' % c) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_named_unicode_escapes(self): # test individual Unicode named escapes self.assertTrue(re.match(r'\N{LESS-THAN SIGN}', '<')) @@ -789,6 +797,8 @@ def test_string_boundaries(self): # Can match around the whitespace. self.assertEqual(len(re.findall(r"\B", " ")), 2) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_bigcharset(self): self.assertEqual(re.match("([\u2222\u2223])", "\u2222").group(1), "\u2222") @@ -861,6 +871,8 @@ def test_lookbehind(self): self.assertRaises(re.error, re.compile, r'(a)b(?<=(a)(?(2)b|x))(c)') self.assertRaises(re.error, re.compile, r'(a)b(?<=(.)(?<=\2))(c)') + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_ignore_case(self): self.assertEqual(re.match("abc", "ABC", re.I).group(0), "ABC") self.assertEqual(re.match(b"abc", b"ABC", re.I).group(0), b"ABC") @@ -901,6 +913,8 @@ def test_ignore_case(self): self.assertTrue(re.match(r'\ufb05', '\ufb06', re.I)) self.assertTrue(re.match(r'\ufb06', '\ufb05', re.I)) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_ignore_case_set(self): self.assertTrue(re.match(r'[19A]', 'A', re.I)) self.assertTrue(re.match(r'[19a]', 'a', re.I)) @@ -939,6 +953,8 @@ def test_ignore_case_set(self): self.assertTrue(re.match(r'[19\ufb05]', '\ufb06', re.I)) self.assertTrue(re.match(r'[19\ufb06]', '\ufb05', re.I)) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_ignore_case_range(self): # Issues #3511, #17381. self.assertTrue(re.match(r'[9-a]', '_', re.I)) @@ -1137,6 +1153,8 @@ def test_pickling(self): # current pickle expects the _compile() reconstructor in re module from re import _compile + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_copying(self): import copy p = re.compile(r'(?P\d+)(?:\.(?P\d*))?') @@ -1442,6 +1460,8 @@ def test_bug_817234(self): self.assertEqual(next(iter).span(), (4, 4)) self.assertRaises(StopIteration, next, iter) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_bug_6561(self): # '\d' should match characters in Unicode category 'Nd' # (Number, Decimal Digit), but not those in 'Nl' (Number, @@ -1471,6 +1491,8 @@ def test_empty_array(self): self.assertIsNone(re.compile(b"bla").match(a)) self.assertEqual(re.compile(b"").match(a).groups(), ()) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_inline_flags(self): # Bug #1700 upper_char = '\u1ea0' # Latin Capital Letter A with Dot Below @@ -1753,6 +1775,10 @@ def test_bug_6509(self): pat = re.compile(b'..') self.assertEqual(pat.sub(lambda m: b'bytes', b'a5'), b'bytes') + # RUSTPYTHON: here in rustpython, we borrow the string only at the + # time of matching, so we will not check the string type when creating + # SRE_Scanner, expect this, other tests has passed + @cpython_only def test_dealloc(self): # issue 3299: check for segfault in debug build import _sre @@ -1859,6 +1885,8 @@ def test_issue17998(self): self.assertEqual(re.compile(pattern, re.S).findall(b'xyz'), [b'xyz'], msg=pattern) + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_match_repr(self): for string in '[abracadabra]', S('[abracadabra]'): m = re.search(r'(.+)(.*?)\1', string) @@ -1905,6 +1933,9 @@ def test_zerowidth(self): self.assertEqual([m.span() for m in re.finditer(r"\b|\w+", "a::bc")], [(0, 0), (0, 1), (1, 1), (3, 3), (3, 5), (5, 5)]) + # TODO: RUSTPYTHON + # @unittest.expectedFailure + @unittest.skip("") def test_bug_2537(self): # issue 2537: empty submatches for outer_op in ('{0,}', '*', '+', '{1,187}'): @@ -2237,6 +2268,8 @@ def test_inline_flags(self): self.check('(?i)pattern', "re.compile('(?i)pattern', re.IGNORECASE)") + # TODO: RUSTPYTHON + @unittest.expectedFailure def test_unknown_flags(self): self.check_flags('random pattern', 0x123000, "re.compile('random pattern', 0x123000)") diff --git a/extra_tests/snippets/stdlib_re.py b/extra_tests/snippets/stdlib_re.py index 45a505fcf7..17ecdba7f6 100644 --- a/extra_tests/snippets/stdlib_re.py +++ b/extra_tests/snippets/stdlib_re.py @@ -67,4 +67,7 @@ urlpattern = re.compile('//([^/#?]*)(.*)', re.DOTALL) url = '//www.example.org:80/foo/bar/baz.html' -assert urlpattern.match(url).group(1) == 'www.example.org:80' \ No newline at end of file +assert urlpattern.match(url).group(1) == 'www.example.org:80' + +assert re.compile('(?:\w+(?:\s|/(?!>))*)*').match('a /bb />ccc').group() == 'a /bb ' +assert re.compile('(?:(1)?)*').match('111').group() == '111' \ No newline at end of file diff --git a/vm/Cargo.toml b/vm/Cargo.toml index 3c72b2de0a..5fd905c8a0 100644 --- a/vm/Cargo.toml +++ b/vm/Cargo.toml @@ -72,7 +72,8 @@ memoffset = "0.6.5" optional = "0.5.0" # RustPython crates implementing functionality based on CPython -sre-engine = "0.1.2" +# sre-engine = "0.1.2" +sre-engine = { git = "https://github.com/qingshi163/sre-engine", branch = "refactor" } # to work on sre-engine locally # sre-engine = { path = "../../sre-engine" } From abc75866623808fa3510d65d0ffeecde3cda5799 Mon Sep 17 00:00:00 2001 From: Jeong YunWon Date: Wed, 27 Jul 2022 05:14:34 +0900 Subject: [PATCH 3/3] bump up sre-engine to 0.2.0 --- Cargo.lock | 5 +++-- vm/Cargo.toml | 3 +-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index ecca468c98..e0094cecbd 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -2066,8 +2066,9 @@ dependencies = [ [[package]] name = "sre-engine" -version = "0.1.2" -source = "git+https://github.com/qingshi163/sre-engine?branch=refactor#82675ae5bd541139163c33312f84e421dddcdd1e" +version = "0.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "55e283f0ec6488739d0b972e3c17b70a8698b33c298a169430387f871af51a03" dependencies = [ "bitflags", "num_enum", diff --git a/vm/Cargo.toml b/vm/Cargo.toml index 5fd905c8a0..f1771238b5 100644 --- a/vm/Cargo.toml +++ b/vm/Cargo.toml @@ -72,8 +72,7 @@ memoffset = "0.6.5" optional = "0.5.0" # RustPython crates implementing functionality based on CPython -# sre-engine = "0.1.2" -sre-engine = { git = "https://github.com/qingshi163/sre-engine", branch = "refactor" } +sre-engine = "0.2.0" # to work on sre-engine locally # sre-engine = { path = "../../sre-engine" }