boren - 学习爬取图片

# 通过爬虫下载10张亚瑟图片
# 1.导包
import os
import requests
import re
# 2. Ask the user which keyword to search images for.
wenti = input("你想下载神魔图片")
# Intended number of images to download. Nothing reads this yet because the
# download loop has not been written.
number = 10
# Create an output directory named after the keyword. exist_ok=True makes the
# call a no-op when the directory is already there, without the
# check-then-create race of os.path.exists() followed by os.makedirs().
os.makedirs(wenti, exist_ok=True)
# 3. Build the search URL: the fixed query string for Baidu's "flip" image
# search page. The keyword is NOT concatenated here; it is supplied through
# `params` below so that requests percent-encodes it (a keyword containing
# '&', '#' or spaces would otherwise corrupt the query string).
url = r'http://image.baidu.com/search/flip?tn=baiduimage&ipn=r&ct=201326592&cl=2&lm=-1&st=-1&fm=result&fr=&sf=1&fmq=1497491098685_R&pv=&ic=0&nc=1&z=&se=1&showtab=0&fb=0&width=&height=&face=0&istype=2&ie=utf-8&ctd=1497491098685%5E00_1519X735'
# 3.1 Fetch the page source. The timeout keeps the script from hanging forever
# on an unresponsive server; raise_for_status() stops on an HTTP error instead
# of silently scanning an error page.
get = requests.get(url, params={'word': wenti}, timeout=10)
get.raise_for_status()
# 3.2 Extract every image link: the non-greedy group captures the text between
# 'objURL":"' and the next '",' in the page source.
tupian_url = re.findall(r'objURL":"(.*?)",', get.text)
print(tupian_url)
# 3.3 上一步的正则已把源代码里每一张图片的链接提取到 tupian_url 中
# 2.循环下载(尚未实现):遍历 tupian_url 中的前 number 个链接,逐个按下面第 4 步的方式保存



# 4. Save: download one sample image and write it to disk.

# Repeated import (requests is already imported at the top of the file);
# harmless, and keeps this snippet runnable when copied on its own.
import requests
url = r"http://b-ssl.duitang.com/uploads/item/201705/21/20170521064802_TNweY.jpeg"
# The timeout prevents an indefinite hang if the server never answers.
tupian = requests.get(url, timeout=10)
# Stop here on an HTTP error rather than saving an error page under a
# .jpeg file name.
tupian.raise_for_status()
# open(file name, mode): "wb" writes raw bytes, which is what .content holds.
# The with-statement closes the file even if write() raises.
with open("ma1.jpeg", "wb") as f:
    f.write(tupian.content)
发布了254 篇原创文章 · 获赞 16 · 访问量 9482

猜你喜欢

转载自blog.csdn.net/houlaos/article/details/104109546