爬虫-某游戏交易网站商品信息爬取
本站所有与爬虫相关的技术仅限于学习交流,请勿商用!切勿给对方服务器造成压力!
from requests_html import HTMLSession
def _text_or_none(node):
    """Return ``node.text``, or ``None`` when the selector matched nothing.

    ``Element.find(..., first=True)`` yields ``None`` for a missing element;
    guarding here keeps one incomplete listing from aborting the whole run.
    """
    return node.text if node is not None else None


# Listing page whose entries are printed below.
url_api = "http://s.5173.com/tlbb-0-g4h3lf-vmpiyq-0-sevxou-0-0-0-a-a-a-a-a-0-0-0-0.shtml"

# NOTE(review): the browser options presumably only matter if the page is
# rendered (r.html.render()); this script never renders. Also, `headless`
# may not be accepted by every requests_html release — confirm against the
# installed version.
session = HTMLSession(
    browser_args=[
        # Was '--no-sand', which is not a Chromium switch; '--no-sandbox'
        # is the flag the library itself passes by default.
        '--no-sandbox',
        '--user-agent=Mozilla/5.0',
    ],
    headless=False,
)

# Without a timeout the request can block forever on an unresponsive server.
r = session.get(url=url_api, timeout=10)

# Every element matching '.sin_pdlbox' is handled as one listing entry.
res = r.html.find('.sin_pdlbox')
for item in res:
    # Selector meanings are inferred from their class names (title, price,
    # unit price, seller credit link) — verify against the page markup.
    title = item.find('.tt h2', first=True)
    price = item.find('.pdlist_price .pr', first=True)
    unit_price = item.find('.pdlist_unitprice li', first=True)
    credit_link = item.find('.credit a', first=True)

    # Always print four lines per listing; a missing field prints None,
    # matching what a missing href attribute already printed.
    print(_text_or_none(title))
    print(_text_or_none(price))
    print(_text_or_none(unit_price))
    print(credit_link.attrs.get('href') if credit_link is not None else None)