import re
import requests
# List pages are numbered from 0 in the URL, for example:
#   http://www.xiaohuar.com/list-1-0.html
#   http://www.xiaohuar.com/list-1-1.html
#   http://www.xiaohuar.com/list-1-2.html
#   http://www.xiaohuar.com/list-1-3.html
#   http://www.xiaohuar.com/list-1-4.html
# Captures the image URL from each thumbnail tag on a list page.
# Compiled once here instead of being looked up on every page.
_IMG_SRC_RE = re.compile('" src="(.*?)" /></a>')

# Number of list pages to walk: list-1-0.html through list-1-43.html.
_PAGE_COUNT = 44

# Seconds to wait on a request; without a timeout a stalled server
# would block the crawl indefinitely.
_TIMEOUT = 10


def extract_image_urls(html):
    """Return the image URLs in *html* that start with ``https``.

    Args:
        html: Text of a list page.

    Returns:
        A list of URL strings, in the order they appear in the page.
        Sources that do not start with ``https`` are dropped.
    """
    return [src for src in _IMG_SRC_RE.findall(html) if src.startswith('https')]


def image_name(url):
    """Return the text after the last ``/`` in *url*.

    The result is used as the local file name and is empty when *url*
    ends with a slash.
    """
    return url.split('/')[-1]


def fetch(url):
    """GET *url* and return the response, or ``None`` on failure.

    Connection errors, timeouts and non-2xx statuses are reported on
    stdout and turned into ``None`` so a single bad URL does not abort
    the whole crawl.
    """
    try:
        response = requests.get(url, timeout=_TIMEOUT)
        # Reject 4xx/5xx so an error page is never saved as an image.
        response.raise_for_status()
    except requests.RequestException as exc:
        print(f'skipped {url}: {exc}')
        return None
    return response


def main():
    """Download every ``https`` image linked from the list pages.

    Each image is written to the current working directory under the
    last path segment of its URL, and a progress line is printed after
    each file is saved.

    Returns:
        The number of images saved.
    """
    count = 0
    for i in range(_PAGE_COUNT):
        page = fetch(f'http://www.xiaohuar.com/list-1-{i}.html')
        if page is None:
            continue
        for img_url in extract_image_urls(page.text):
            img_name = image_name(img_url)
            if not img_name:
                # A URL ending in '/' has no usable file name; open('') would raise.
                continue
            img_response = fetch(img_url)
            if img_response is None:
                continue
            # The with-block flushes and closes the file on exit.
            with open(img_name, 'wb') as fw:
                fw.write(img_response.content)
            count += 1
            print(f'爬取了{count}张')
    return count


if __name__ == '__main__':
    main()