![python中的re模块中的向后引用和零宽断言 python中的re模块中的向后引用和零宽断言](https://image.shishitao.com:8440/aHR0cHM6Ly9iYnNtYXguaWthZmFuLmNvbS9zdGF0aWMvTDNCeWIzaDVMMmgwZEhCekwybHRZV2RsY3pJd01UZ3VZMjVpYkc5bmN5NWpiMjB2WW14dlp5OHhNalV5T0RneUx6SXdNVGd3T0M4eE1qVXlPRGd5TFRJd01UZ3dPRE14TVRVMU9EVTRPVEEwTFRRMk9UTXdOelEyTWk1d2JtYz0uanBn.jpg?w=700&webp=1)
1.后向引用
import re

# Back-references: find a word that is immediately followed by itself.
#
# Patterns that lead up to the final one, with their findall() results on
# `text` below:
#   r"(\w+)"             every word -> all ten words
#   r"\b(\w+)\b\s+\b"    every word that is followed by whitespace
#                        -> the first nine words
#   r"\b(\w+)\b\s+\1\b"  a word repeated right after itself, using the
#                        numbered back-reference \1
#                        -> ['hello', 'go', 'come', 'go', 'hello']
text = 'hello hello go go come come go go hello hello'

# Same as the last pattern above, but with a named group (?P<word>...) and a
# named back-reference (?P=word). findall() returns the group's text, so each
# repeated pair is reported once.
pattern = re.compile(r"\b(?P<word>\w+)\b\s+(?P=word)\b")
print(pattern.findall(text))  # ['hello', 'go', 'come', 'go', 'hello']
2.零宽断言
import re

# Zero-width assertions (lookarounds) test a position without consuming text.

# (?=exp) look-ahead: the match must be directly followed by exp.
# Here: the stem of every word that ends in "ing".
text = "I'm singing while you're dancing."
pattern = re.compile(r"\b\w+(?=ing\b)")
print(pattern.findall(text))  # ['sing', 'danc']

# (?<=exp) look-behind: the match must be directly preceded by exp.
# Here: the rest of a word that starts with "re".
text = 'reading a book'
pattern = re.compile(r"(?<=\bre)\w+\b")
print(pattern.findall(text))  # ['ading']

# Numbers that make up a whole comma-separated field.
# A lookaround followed by `?` is optional and therefore constrains nothing,
# so negative lookarounds are used instead: "not preceded / not followed by a
# non-comma character" also accepts the start and end of the string.
text = '123,456,789'
pattern = re.compile(r"(?<![^,])\d+(?![^,])")
print(pattern.findall(text))  # ['123', '456', '789']
3.负向零宽断言（注：下面的示例实际使用的是正向零宽断言 (?<=exp) 和 (?=exp)，并结合后向引用 \1；负向零宽断言的写法是 (?<!exp) 和 (?!exp)）
import re

# Combine look-behind, look-ahead and a back-reference to pull out the text
# between an opening tag and its matching closing tag.
#   (?<=<(\w{4})>)  preceded by an opening tag; the tag name is captured as
#                   group 1. The name is fixed at 4 characters because
#                   Python's look-behind must have a fixed width.
#   (.*?)           the content, lazy so it stops at the first closing tag
#                   instead of running on to the last one.
#   (?=</\1>)       followed by the closing tag with the same name.
text = '<span> hello world </span>'
pattern = re.compile(r"(?<=<(\w{4})>)(.*?)(?=</\1>)")
# The content is captured verbatim, including the surrounding spaces.
print(pattern.findall(text))  # [('span', ' hello world ')]