# Demonstrates the difference between greedy (`.*`) and non-greedy (`.*?`)
# regex quantifiers when matching <div>...</div> markup.
import re

# Two sibling <div> elements separated by plain text.
str1 = r'aa<div>test1</div>bb<div>test2</div>cc'
# One <div> element nested inside another.
str2 = r'aa<div>test1<div>test2</div></div>cc'

# Greedy mode: `.*` consumes as much as it can, so the match runs from the
# first `<div>` to the LAST `</div>` in str1 and covers both elements.
pattern = re.compile(r'<div>.*</div>')
s = pattern.search(str1)
print(s)

# Non-greedy mode 1: `.*?` consumes as little as it can, so the match ends at
# the FIRST `</div>` and covers only the first element of str1.
pattern = re.compile(r'<div>.*?</div>')
s = pattern.search(str1)
print(s)

# Non-greedy mode 2: the same non-greedy pattern applied to nested markup.
# The match still ends at the first `</div>`, which belongs to the inner
# element, so the outer <div> is left unclosed in the result -- a regex
# cannot pair nested tags. The compiled pattern is reused rather than
# recompiled because it is identical to the one above.
s = pattern.search(str2)
print(s)
/Library/Frameworks/Python.framework/Versions/3.6/bin/python3.6 /Users/apple/PycharmProjects/stage4/spider/2018——0307/re_tanlan.py
<_sre.SRE_Match object; span=(2, 36), match='<div>test1</div>bb<div>test2</div>'>
<_sre.SRE_Match object; span=(2, 18), match='<div>test1</div>'>
<_sre.SRE_Match object; span=(2, 28), match='<div>test1<div>test2</div>'>
Process finished with exit code 0