您的位置:首页 > 编程语言 > Python开发

Python——用爬虫下载妹子图

2016-08-21 14:27 465 查看
import os
import re
import urllib.request

def agentIp(url='http://www.kuaidaili.com/'):
    """Return the first IPv4 address that appears in the page at ``url``.

    The page is fetched with ``urllib.request.urlopen``, decoded as UTF-8 and
    scanned for the first dotted quad whose four octets are each 0-255.

    Args:
        url: Page to scan. Defaults to the proxy-list site this script was
            originally pointed at.

    Returns:
        The first matching address as a string, e.g. ``'10.20.30.249'``.

    Raises:
        IndexError: If the page contains no IPv4 address.
        urllib.error.URLError: If the page cannot be fetched.
        UnicodeDecodeError: If the response body is not valid UTF-8.
    """
    # 25[0-5] and 2[0-4][0-9] together cover 200-255. The previous pattern
    # (2[0-5][0-5]) rejected octets such as 249 and silently truncated them.
    octet = r'(?:25[0-5]|2[0-4][0-9]|1[0-9][0-9]|[1-9]?[0-9])'
    # The digit look-arounds stop a match from starting or ending in the
    # middle of a longer number (e.g. "99.1.2.3" inside "999.1.2.3").
    pat = re.compile(
        r'(?<![0-9])(?:' + octet + r'\.){3}' + octet + r'(?![0-9])'
    )

    # The context manager closes the connection even if read/decode fails.
    with urllib.request.urlopen(url) as html:
        content = html.read().decode('utf-8')

    found = pat.search(content)
    if found is None:
        # Same exception type the old ``p[0][0]`` lookup raised, but with a
        # message that says what actually went wrong.
        raise IndexError('no IPv4 address found in ' + url)
    return found.group(0)

def openTargetUrl(url='http://jandan.net/ooxx/page-2099#comments'):
    """Collect the ``.jpg`` image URLs referenced by ``<img>`` tags on a page.

    The page is requested with a desktop-browser ``User-agent`` header,
    decoded as UTF-8, and searched for ``<img src="http://....jpg``
    occurrences.

    Args:
        url: Page to scrape. Defaults to the single gallery page this script
            was written for.

    Returns:
        A list of image URLs (strings) in the order they appear in the page;
        empty when the page has no matching ``<img>`` tag.

    Raises:
        urllib.error.URLError: If the page cannot be fetched.
        UnicodeDecodeError: If the response body is not valid UTF-8.
    """
    req = urllib.request.Request(url)
    req.add_header('User-agent', 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36')

    # The context manager closes the connection even if read/decode fails.
    with urllib.request.urlopen(req) as res:
        content = res.read().decode('utf-8')

    # ``[^"]*`` keeps each match inside one src attribute. The previous
    # greedy ``.*`` ran from the first <img> to the last ".jpg" on the line,
    # merging several tags into one bogus URL. The capture group returns the
    # URL itself, so the '<img src="' prefix no longer needs slicing off.
    return re.findall(r'<img src="(http://[^"]*\.jpg)', content)

def download(L, dest_dir=r'D:\Download\PythonJPG'):
    """Download every URL in ``L`` into ``dest_dir``.

    Each URL is requested with a desktop-browser ``User-agent`` header and the
    response body is written, unmodified, to a file named after the last
    ``/``-separated segment of the URL. An existing file with the same name
    is overwritten.

    Args:
        L: Iterable of URL strings to fetch.
        dest_dir: Directory that receives the files; created (including
            parents) if it does not exist. Defaults to the Windows folder the
            script originally wrote to.

    Returns:
        None.

    Raises:
        urllib.error.URLError: If a URL cannot be fetched.
        OSError: If the directory cannot be created or a file cannot be
            written.
    """
    user_agent = 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36'

    # Previously a missing folder made the first open() fail.
    os.makedirs(dest_dir, exist_ok=True)

    for url in L:
        # The name comes from remote data: basename() drops any directory
        # part (e.g. backslashes on Windows) so it cannot leave dest_dir.
        name = os.path.basename(url.rsplit('/', 1)[-1])

        req = urllib.request.Request(url)
        req.add_header('User-agent', user_agent)
        # Close each connection as soon as its body has been read.
        with urllib.request.urlopen(req) as res:
            content = res.read()

        with open(os.path.join(dest_dir, name), 'wb') as f:
            f.write(content)

def main():
    """Scrape the default page, save its images, then print a completion message."""
    image_urls = openTargetUrl()
    download(image_urls)
    print("图片下载完成!")
    # NOTE: agentIp() is not invoked by this entry point.

# Run the scraper only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()


左边是代码,右边是下载的图片。代码比较简单,目前只能下载一页,以后有空再完善。

内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签:  python 爬虫