[Python]代码
#!/usr/bin/env python
import os
import urllib.parse
import urllib.request

from bs4 import BeautifulSoup
def crawl(url):
    """Download every image referenced by an ``<img>`` tag on the page at *url*.

    The page is fetched with a browser-like User-Agent, parsed with
    BeautifulSoup, and each image is written to ``D:/doubanmeizi`` under a
    file name made of the last 11 characters of the image URL.

    Args:
        url: Address of the HTML page to scan for images.

    Raises:
        urllib.error.URLError: If the page or any image cannot be fetched.
        OSError: If the target directory or an image file cannot be written.
    """
    headers = {'User-Agent':'Mozilla/5.0 (Windows; U; Windows NT 6.1; en-US; rv:1.9.1.6) Gecko/20091201 Firefox/3.5.6'}
    save_dir = u'D:/doubanmeizi'
    # Characters that are not allowed in Windows file names; a URL tail can
    # easily contain '/', '?' or ':'.
    unsafe_chars = str.maketrans({ch: '_' for ch in '\\/:*?"<>|'})

    # open() below would fail if the target directory did not exist yet.
    os.makedirs(save_dir, exist_ok=True)

    req = urllib.request.Request(url, headers=headers)
    # The context manager closes the HTTP response once the body is read.
    with urllib.request.urlopen(req, timeout=20) as page:
        contents = page.read()

    # Name the parser explicitly so results do not depend on which optional
    # parsers happen to be installed (and bs4 does not warn about guessing).
    soup = BeautifulSoup(contents, 'html.parser')

    for girl in soup.find_all('img'):
        src = girl.get('src')
        if not src:
            # <img> without a usable src attribute: nothing to download.
            continue
        # Resolve relative and protocol-relative references against the page.
        link = urllib.parse.urljoin(url, src)
        print(link)
        # Reuse the page's headers and timeout for the image request as well.
        img_req = urllib.request.Request(link, headers=headers)
        with urllib.request.urlopen(img_req, timeout=20) as resp:
            content2 = resp.read()
        filename = link[-11:].translate(unsafe_chars)
        with open(save_dir+'/'+filename,'wb') as code:
            code.write(content2)
# Driver: crawl pager offsets page_start+1 through page_stop
# (1..10 with the values below), then report completion.
page_start = 0
page_stop = 10
for page in range(page_start + 1, page_stop + 1):
    url = 'http://www.dbmeinv.com/?pager_offset=%s' % page
    crawl(url)
print("哈哈,妹子图片下载完毕啦!")
原创文章,作者:ItWorker,如若转载,请注明出处:https://blog.ytso.com/tech/pnotes/8106.html