# 1. Basics
import requests
from bs4 import BeautifulSoup
# Fetch the page, then parse the returned HTML.
# The parser name belongs to BeautifulSoup, not to requests.get: the second
# positional argument of requests.get is `params` (query-string data), so
# passing 'html.parser' there would send it as part of the request URL.
res = requests.get('http://www.baidu.com')
soup = BeautifulSoup(res.text, 'html.parser')
# Select by CSS class: text of the first element matching class "time-source".
# Indexing with [0] raises IndexError when nothing matches.
soup.select('.time-source')[0].text
# Select by id: text of the first element matching id "artibodytitle".
soup.select('#artibodytitle')[0].text
# Time: parse a timestamp string into a datetime, then format it as a date.
from datetime import datetime
# NOTE(review): `timesource` is not defined anywhere in this snippet --
# presumably a timestamp string extracted from the page; confirm.
# The format expects "YYYY MM DD HH:MM" (space-separated date parts).
dt = datetime.strptime(timesource,'%Y %m %d %H:%M')
# Render the parsed datetime as "YYYY-MM-DD".
dt.strftime('%Y-%m-%d')
# Slice the select() result: every element matching id "id" except the last.
# (Plain ASCII quotes are required; typographic quotes are a SyntaxError.)
soup.select('#id')[:-1]
# Merge a list of strings into a single string, separated by single spaces.
article = []
' '.join(article)