【Jupyter notebook】
import re
match = re.search(r'[1-9]\d{5}', 'BIT 100081')
if match:
print(match.group(0))
100081
match = re.match(r'[1-9]\d{5}', 'BIT 100081')
if match:
print(match.group(0))
else:
print("not found")
not found
match = re.match(r'[1-9]\d{5}', '100081 BIT')
if match:
print(match.group(0))
else:
print("not found")
100081
ls = re.findall(r'[1-9]\d{5}','BIT100081 TSU100084 000008DUX')
ls
['100081', '100084']
re.split(r'[1-9]\d{5}','BIT 100081 TSU 100084 000008DUX')
['BIT ', ' TSU ', ' 000008DUX']
re.split(r'[1-9]\d{5}','BIT100081 TSU100084 000008DUX', maxsplit=1)
['BIT', ' TSU100084 000008DUX']
for m in re.finditer(r'[1-9]\d{5}','BIT100081 TSU100083'):
if m:
print(m.group(0))
else:
print('not found')
100081
100083
re.sub(r'[1-9]\d{5}', ':zipcode','BIT100081 TSU100084')
'BIT:zipcode TSU:zipcode'
pat = re.compile(r'[1-9]\d{5}')
pat.findall('BIT100081 TSU100083')
['100081', '100083']
for item in pat.finditer('BIT100081 TSU100083 100038UAB U100032AS'):
print(item.group(0))
100081
100083
100038
100032
pat.search('BIT100081 TSU100083 100038UAB U100032AS')
<_sre.SRE_Match object; span=(3, 9), match='100081'>
m = pat.search('BIT100081 TSU100083 100038UAB U100032AS')
m.string
'BIT100081 TSU100083 100038UAB U100032AS'
m.re
re.compile(r'[1-9]\d{5}', re.UNICODE)
m.start()
3
m.end()
9
m.span()
(3, 9)
pat = re.compile(r'PY.*N')
m = pat.search("PYANBNCNDN")
m.group(0)
'PYANBNCNDN'
# 但是如果我们只想匹配最短的即“PYAN”,怎么办?
pat = re.compile(r'PY.*?N')
m = pat.search("PYANBNCNDN")
m.group(0)
'PYAN'
def match(pattern, string, flags=0):
"""Try to apply the pattern at the start of the string, returning
a match object, or None if no match was found."""
return _compile(pattern, flags).match(string)
def fullmatch(pattern, string, flags=0):
"""Try to apply the pattern to all of the string, returning
a match object, or None if no match was found."""
return _compile(pattern, flags).fullmatch(string)
def search(pattern, string, flags=0):
"""Scan through string looking for a match to the pattern, returning
a match object, or None if no match was found."""
return _compile(pattern, flags).search(string)
def sub(pattern, repl, string, count=0, flags=0):
"""Return the string obtained by replacing the leftmost
non-overlapping occurrences of the pattern in string by the
replacement repl. repl can be either a string or a callable;
if a string, backslash escapes in it are processed. If it is
a callable, it's passed the match object and must return
a replacement string to be used."""
return _compile(pattern, flags).sub(repl, string, count)
def subn(pattern, repl, string, count=0, flags=0):
"""Return a 2-tuple containing (new_string, number).
new_string is the string obtained by replacing the leftmost
non-overlapping occurrences of the pattern in the source
string by the replacement repl. number is the number of
substitutions that were made. repl can be either a string or a
callable; if a string, backslash escapes in it are processed.
If it is a callable, it's passed the match object and must
return a replacement string to be used."""
return _compile(pattern, flags).subn(repl, string, count)
def split(pattern, string, maxsplit=0, flags=0):
"""Split the source string by the occurrences of the pattern,
returning a list containing the resulting substrings. If
capturing parentheses are used in pattern, then the text of all
groups in the pattern are also returned as part of the resulting
list. If maxsplit is nonzero, at most maxsplit splits occur,
and the remainder of the string is returned as the final element
of the list."""
return _compile(pattern, flags).split(string, maxsplit)
def findall(pattern, string, flags=0):
"""Return a list of all non-overlapping matches in the string.
If one or more capturing groups are present in the pattern, return
a list of groups; this will be a list of tuples if the pattern
has more than one group.
Empty matches are included in the result."""
return _compile(pattern, flags).findall(string)
def finditer(pattern, string, flags=0):
"""Return an iterator over all non-overlapping matches in the
string. For each match, the iterator returns a match object.
Empty matches are included in the result."""
return _compile(pattern, flags).finditer(string)
def compile(pattern, flags=0):
"Compile a regular expression pattern, returning a pattern object."
return _compile(pattern, flags)
def purge():
"Clear the regular expression caches"
_cache.clear()
_compile_repl.cache_clear()