Thanks to visit codestin.com
Credit goes to github.com

Skip to content

Commit 6c6b78d

Browse files
committed
Initial revision
1 parent 564f550 commit 6c6b78d

2 files changed

Lines changed: 78 additions & 0 deletions

File tree

Lib/regex_syntax.py

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
# These bits are passed to regex.set_syntax() to choose among
2+
# alternative regexp syntaxes.
3+
4+
# 1 means plain parentheses serve as grouping, and backslash
5+
# parentheses are needed for literal searching.
6+
# 0 means backslash-parentheses are grouping, and plain parentheses
7+
# are for literal searching.
8+
RE_NO_BK_PARENS = 1
9+
10+
# 1 means plain | serves as the "or"-operator, and \| is a literal.
11+
# 0 means \| serves as the "or"-operator, and | is a literal.
12+
RE_NO_BK_VBAR = 2
13+
14+
# 0 means plain + or ? serves as an operator, and \+, \? are literals.
15+
# 1 means \+, \? are operators and plain +, ? are literals.
16+
RE_BK_PLUS_QM = 4
17+
18+
# 1 means | binds tighter than ^ or $.
19+
# 0 means the contrary.
20+
RE_TIGHT_VBAR = 8
21+
22+
# 1 means treat \n as an _OR operator
23+
# 0 means treat it as a normal character
24+
RE_NEWLINE_OR = 16
25+
26+
# 0 means that a special characters (such as *, ^, and $) always have
27+
# their special meaning regardless of the surrounding context.
28+
# 1 means that special characters may act as normal characters in some
29+
# contexts. Specifically, this applies to:
30+
# ^ - only special at the beginning, or after ( or |
31+
# $ - only special at the end, or before ) or |
32+
# *, +, ? - only special when not after the beginning, (, or |
33+
RE_CONTEXT_INDEP_OPS = 32
34+
35+
# Now define combinations of bits for the standard possibilities.
36+
RE_SYNTAX_AWK = (RE_NO_BK_PARENS | RE_NO_BK_VBAR | RE_CONTEXT_INDEP_OPS)
37+
RE_SYNTAX_EGREP = (RE_SYNTAX_AWK | RE_NEWLINE_OR)
38+
RE_SYNTAX_GREP = (RE_BK_PLUS_QM | RE_NEWLINE_OR)
39+
RE_SYNTAX_EMACS = 0
40+
41+
# (Python's obsolete "regexp" module used a syntax similar to awk.)

Lib/regexp.py

Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
1+
# Provide backward compatibility for module "regexp" using "regex".
2+
3+
import regex
4+
from regex_syntax import *
5+
6+
class Prog:
7+
def init(self, pat):
8+
save_syntax = regex.set_syntax(RE_SYNTAX_AWK)
9+
try:
10+
self.prog = regex.compile(pat)
11+
finally:
12+
xxx = regex.set_syntax(save_syntax)
13+
return self
14+
def match(self, args):
15+
if type(args) = type(()):
16+
str, offset = args
17+
else:
18+
str, offset = args, 0
19+
if self.prog.search(str, offset) < 0:
20+
return ()
21+
regs = self.prog.regs()
22+
i = len(regs)
23+
while i > 0 and regs[i-1] = (-1, -1):
24+
i = i-1
25+
return regs[:i]
26+
27+
def compile(pat):
28+
return Prog().init(pat)
29+
30+
cache_pat = None
31+
cache_prog = None
32+
33+
def match(pat, str):
34+
global cache_pat, cache_prog
35+
if pat <> cache_pat:
36+
cache_pat, cache_prog = pat, compile(pat)
37+
return cache_prog.match(str)

0 commit comments

Comments
 (0)