import urllib2
import re
# Open the Baidu home page over HTTP and keep the handle returned by
# urlopen() in `response`.
response = urllib2.urlopen(url='http://www.baidu.com/')
# Sample markup containing two <title> elements, used to compare how the
# patterns below behave when more than one element is present.
text = 'JGood is<title>sdfa</title> a handsome <title> boy, </title>he is cool, clever, and so on...'
# Copy of the sample with every 'y' removed.
text2 = text.replace('y', '')

# Earlier attempts, kept for comparison:
#   re.search(r'<title>(.*)<\/title>', response.read())
#       same search, run against the fetched page instead of the sample
#   re.match(r'.*<title>(.*)<\/title>.*', response.read())
#   re.match(r'.*<title>(.*)<\/title>.*', text2)
#       re.match() only matches at the start of the string, hence the
#       leading/trailing '.*' padding

# Extract the first title. The capture is non-greedy: a greedy '(.*)' runs on
# to the LAST '</title>' and would return
# 'sdfa</title> a handsome <title> bo, ' for this sample.
m = re.search(r'<title>(.*?)</title>', text2)
title = None
if m is not None:  # re.search() returns None when nothing matches
    title = m.group(1)
    # Python 2 byte strings are decoded before printing; text that is already
    # unicode (every str on Python 3) has no decode step to perform.
    if isinstance(title, bytes):
        title = title.decode('utf-8', 'ignore')
    print(title)

# Iterating over every title instead of just the first one:
#   re.finditer(r'<title>(.*)</title>', text)
#       greedy, so it yields a single match spanning both elements
#   re.finditer(r'<title>([^<title>]*)</title>', text)
#       '[^<title>]' is a character class: it rejects any single character
#       out of '<', 't', 'i', 'l', 'e', '>', not the string '<title>'
# In the pattern below every captured character except the last must not be
# followed by '<title>', which keeps one match from running on into the next
# element. group(1) is the text between the tags; at least one character is
# required there. `m` is rebound to the resulting iterator of match objects.
m = re.finditer(r'<title>((.(?!<title>))*.)</title>', text)