# -*- coding: utf-8 -*-
import os
import re
import sys

import requests
# Gallery pages are numbered; range(FIRST_PAGE_ID, END_PAGE_ID) is crawled,
# so END_PAGE_ID itself is excluded.
FIRST_PAGE_ID = 5000
END_PAGE_ID = 5484

# Directory the downloaded images are written into.
OUTPUT_DIR = 'img3'

# Seconds to wait on any single HTTP request before giving up, so that one
# stalled connection cannot hang the whole crawl.
REQUEST_TIMEOUT = 10

# Request headers sent with every page and image request.
HEADERS = {
    'User-Agent': (
        'Mozilla/5.0 (Linux;u;Android 4.2.2;zh-cn;) '
        'AppleWebKit/534.46 (KHTML,like Gecko) '
        'Version/5.1 Mobile Safari/10600.6.3 '
        '(compatible; Baiduspider/2.0; '
        '+http://www.baidu.com/search/spider.html)'
    ),
}

# NOTE(review): the pattern literal in the original script contained only a
# line break (its markup appears to have been stripped), yet the loop reads
# two captures per match: a title and an image URL.  The pattern below is a
# reconstruction that assumes images are embedded as
# <img alt="TITLE" src="URL" ...> -- TODO confirm against the live page markup.
IMAGE_PATTERN = re.compile(r'<img alt="(.*?)" src="(.*?)"', re.S)


def page_url(page_id):
    """Return the URL of the gallery page numbered *page_id*."""
    return 'http://www.meizitu.com/a/' + str(page_id) + '.html'


def find_images(html):
    """Return a list of (title, image_url) tuples found in *html*."""
    return IMAGE_PATTERN.findall(html)


def safe_filename(title):
    """Return *title* with path separators replaced by underscores.

    The title comes from scraped markup; a separator in it would otherwise
    point the output file at a different (possibly missing) directory.
    """
    for separator in (os.sep, os.altsep):
        if separator:
            title = title.replace(separator, '_')
    return title


def image_path(title):
    """Return the path the image named *title* is saved under."""
    return '%s/%s.jpg' % (OUTPUT_DIR, safe_filename(title))


def fetch(url):
    """GET *url* and return the response, or None if it cannot be used.

    Network errors and non-200 statuses are reported on stderr and turned
    into None so a single bad URL does not abort the whole crawl, and so an
    error page body is never saved as if it were an image.
    """
    try:
        response = requests.get(url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    except requests.RequestException as err:
        sys.stderr.write('skipping %s: %s\n' % (url, err))
        return None
    if response.status_code != 200:
        sys.stderr.write(
            'skipping %s: HTTP %s\n' % (url, response.status_code))
        return None
    return response


def download_page(page_id):
    """Download every image matched on the gallery page *page_id*."""
    page = fetch(page_url(page_id))
    if page is None:
        return
    # Decode the page body as gb2312 rather than whatever requests guesses.
    page.encoding = 'gb2312'
    for title, image_url in find_images(page.text):
        print('%s %s' % (title, image_url))
        image = fetch(image_url)
        if image is None:
            continue
        with open(image_path(title), 'wb') as image_file:
            image_file.write(image.content)


def main():
    """Crawl the configured page range and save all matched images."""
    if not os.path.isdir(OUTPUT_DIR):
        os.makedirs(OUTPUT_DIR)
    for page_id in range(FIRST_PAGE_ID, END_PAGE_ID):
        download_page(page_id)


if __name__ == '__main__':
    main()