电脑系统:win10,在E盘创建目录zhihu_beautylegs
Python:Install
Python 包:requests
#!/usr/bin/env python
import re, requests
SAVE_DIR_PATH = 'E:/zhihu_beautylegs/'
def save(url):
    """Download `url` and store the response body under SAVE_DIR_PATH.

    The local file name is the part of `url` after its last '/'
    (the whole string when `url` contains no '/').

    Args:
        url: address of the resource to download.

    Returns:
        Whatever the file object's ``write`` call returns.
    """
    file_name = url.rsplit('/', 1)[-1]
    # Download before opening the target so a failed request does not
    # leave an empty, truncated file behind.
    payload = requests.get(url).content
    # `with` guarantees the handle is flushed and closed even if write() fails.
    with open(SAVE_DIR_PATH + file_name, 'wb') as out_file:
        return out_file.write(payload)
def flushBlog():
    """Fetch the hard-coded Zhihu question page and extract image URLs from it.

    Returns:
        list: every non-overlapping match of the zhimg.com picture URL
        pattern in the page text, in order of appearance (duplicates are
        not removed).
    """
    print("flush blog stat...")
    url = "http://www.zhihu.com/question/20399991"
    print("url-is:" + url)
    header = {
        # Send a desktop-browser User-Agent string with the request.
        'User-Agent': "Mozilla/5.0 (Windows NT 6.3; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/45.0.2454.101 Safari/537.36",
        'Accept-Encoding': 'gzip, deflate'
    }
    # The session serves this single request only; the context manager
    # closes it (and its pooled connections) as soon as the body is read.
    with requests.Session() as session:
        res = session.get(url, headers=header)
    # Search the decoded text rather than `res.content`: on Python 3 the
    # latter is bytes, and a str pattern cannot be applied to bytes.
    # The dots are escaped so they match a literal '.' only, instead of
    # any character as in the unescaped form.
    return re.findall(
        r'https://pic\d\.zhimg\.com/[a-fA-F0-9]{5,32}_\w+\.(?:png|jpg|jpeg)',
        res.text,
    )
if __name__ == '__main__':
    # Script entry point: collect the image URLs from the page, then
    # announce and download each one in turn.
    for url in flushBlog():
        # Call form of print with a single argument produces the same
        # output on Python 2 and Python 3 (the statement form is a
        # SyntaxError on Python 3).
        print("image-usl=" + url)
        save(url)
如果想从其他页面爬取一些美图,只需修改页面链接(url)和图片匹配规则(正则表达式)即可。