python之正则表达式

python之正则表达式

看了b站莫(da)烦(lao)的视频,感受很详细,本身手敲了一遍,方便你们查看,回头忘了就过来看看。

点击https://www.bilibili.com/video/av16926522/?p=36能够去b站看dalao视频python


在这里插入图片描述

# 1 匹配字符串中的目标字符串
pattern1 = "cat"
pattern2 = "bird"
string = "dog runs to cat"
print(re.search(pattern1, string))
print(re.search(pattern2, string))

#result
<re.Match object; span=(12, 15), match='cat'>
None
#2 匹配多种可能
ptn = r"r[au]n"
string = "dog runs(ran) to cat"
print(re.search(ptn, string))

#result
<re.Match object; span=(4, 7), match='run'>
#发现结果只返回匹配第一个检索到的字符串
#3 匹配更多可能
print(re.search(r"r[A-Z]n", "dog runs to cat"))
print(re.search(r"r[a-z]n", "dog runs to cat"))
print(re.search(r"r[0-9]n", "dog r2ns to cat"))
print(re.search(r"r[0-9a-z]n", "dog runs to cat"))

#result
None
<re.Match object; span=(4, 7), match='run'>
<re.Match object; span=(4, 7), match='r2n'>
<re.Match object; span=(4, 7), match='run'>
#4 \d:数字, \D:非数字
print(re.search(r"r\dn", "run r4n"))
print(re.search(r"r\Dn", "run r4n"))

#result
<re.Match object; span=(4, 7), match='r4n'>
<re.Match object; span=(0, 3), match='run'>
#5 空白:\s, 非空白:\S 
#[\t\n\r\f\v]
print(re.search(r"r\sn", "r\nn r4n"))
print(re.search(r"r\Sn", "r\nn r4n"))

#result
<re.Match object; span=(0, 3), match='r\nn'>
<re.Match object; span=(4, 7), match='r4n'>
#6 全部字母数字和"_"
#\w:[a-zA-Z0-9_], \W相反
print(re.search(r"r\wn", "r\nn r4n"))
print(re.search(r"r\Wn", "r\nn r4n"))

#result
<re.Match object; span=(4, 7), match='r4n'>
<re.Match object; span=(0, 3), match='r\nn'>
#7 空白字符
#\b:仅仅在开始或结只有一个空白字符,\B反之
print(re.search(r"\b runs \b", "dog runs to cat"))
print(re.search(r"\B runs \B", "dog runs to cat"))

#result
<re.Match object; span=(3, 9), match=' runs '>
<re.Match object; span=(4, 10), match=' runs '>
#8 匹配特殊字符
#\\:匹配\, .匹配除了\n
print(re.search(r"runs\\", "dog runs\ to cat"))
print(re.search(r"r.n", "r\"n to cat"))

#result
<re.Match object; span=(4, 9), match='runs\\'>
<re.Match object; span=(0, 3), match='r"n'>
#9 ^: 句首, $: 句尾
print(re.search(r"^dog", "dog runs\ to cat"))
print(re.search(r"cat$", "r\"n to cat"))

#result
<re.Match object; span=(0, 3), match='dog'>
<re.Match object; span=(7, 10), match='cat'>
#10 ?:是否
print(re.search(r"Mon(day)?", "Monday"))
print(re.search(r"Mon(day)?", "Mon"))

#result
<re.Match object; span=(0, 6), match='Monday'>
<re.Match object; span=(0, 3), match='Mon'>
#11 多行匹配 Multi-line
string = ''' Dog runs to the cat. I run to the dog. '''
print(re.search(r"^I", string))
print(re.search(r"^I", string, flags= re.M))

#result
None
<re.Match object; span=(22, 23), match='I'>
#12 *:0或屡次
print(re.search(r"ab*", "a"))
print(re.search(r"ab*", "abbbbbbb"))

#result
<re.Match object; span=(0, 1), match='a'>
<re.Match object; span=(0, 8), match='abbbbbbb'>
#13 +:1或屡次
print(re.search(r"ab+", "a"))
print(re.search(r"ab+", "ab"))

#result
None
<re.Match object; span=(0, 2), match='ab'>
#14 可选次数{n,m}
print(re.search(r"ab{2,10}", "a"))
print(re.search(r"ab{2,10}", "abbbb"))

#result
None
<re.Match object; span=(0, 5), match='abbbb'>
#15 group组
match = re.search(r"(\d+), Date: (.+)", "ID: 21321, Date: Aug/19/2019")
print(match.group())
print(match.group(1))
print(match.group(2))

#result
21321, Date: Aug/19/2019
21321
Aug/19/2019
#16 ?P<name>: 组命名
match = re.search(r"(?P<id>\d+), Date: (?P<date>.+)", "ID: 21321, Date: Aug/19/2019")
print(match.group())
print(match.group('id'))
print(match.group('date'))

#result
21321, Date: Aug/19/2019
21321
Aug/19/2019
#17 findall: 寻找全部匹配
print(re.findall(r"r[au]n", "run ran ren"))

#result
['run', 'ran']
#18 |: 或
print(re.findall(r"r(a|u)n", "run ran ren"))

#result
['u', 'a']
#19 sub: 替换
print(re.sub(r"r[au]n", "catches", "dog runs to cat"))

#result
dog catchess to cat
#20 分裂
print(re.split(r"[,;\.]", "a,b;d.c"))

#result
['a', 'b', 'd', 'c']
#21 compile : 编译
compile_re = re.compile(r"r[au]n")
print(compile_re.search("dog ran to cat"))

#result
<re.Match object; span=(4, 7), match='ran'>

另外,Python默认的是贪婪匹配,返回匹配结果最长的字符串。好比:web

import re
match = re.search(r'py.*?n', 'pyanbncndn')
print(match.group(0))

#result
pyanbncndn

而要想使用最小匹配,则只需加一个?即:正则表达式

import re
match = re.search(r'py.*?n', 'pyanbncndn')
print(match.group(0))

#result
pyan

最小匹配操做符以下:
在这里插入图片描述ide