爬取绝对领域图片
流程
代码
Python 代码
# 爬取绝对领域图片(https://www.jdlingyu.com/tuji)数据
import os

import parsel
import requests
from bs4 import BeautifulSoup
# Crawl the listing pages of jdlingyu.com, follow every post link found on
# them, and download each image referenced in the post body into IMG_DIR.
IMG_DIR = 'img'
REQUEST_TIMEOUT = 10  # seconds; without it requests.get can block forever

# Create the output directory up front so the first write cannot fail on a
# missing folder.
os.makedirs(IMG_DIR, exist_ok=True)


def _fetch(url):
    """Return the response for *url*, or None if the request fails.

    Connection errors, timeouts, malformed URLs and non-2xx statuses are
    reported and skipped so one bad link does not abort the whole crawl.
    """
    try:
        result = requests.get(url, timeout=REQUEST_TIMEOUT)
        result.raise_for_status()
    except requests.RequestException as exc:
        print(f'skipping {url}: {exc}')
        return None
    return result


# 1. Send the request for each listing page (pages 1 through 4).
for page in range(1, 5):
    url = f'https://www.jdlingyu.com/page/{page}'
    response = _fetch(url)
    if response is None:
        continue
    # 2. Get the page source.
    html_data = response.text
    # 3. Parse the listing page for the links to the individual posts.
    selector = parsel.Selector(html_data)
    detail_url_list = selector.css('.post-info h2 a::attr(href)').getall()
    for detail_url in detail_url_list:
        resp = _fetch(detail_url)
        if resp is None:
            continue
        selector2 = parsel.Selector(resp.text)
        # The image address is read from the data-src attribute, not src.
        img_list = selector2.css('.entry-content img::attr(data-src)').getall()
        for img in img_list:
            # The last path segment of the image URL is used as the file name.
            img_name = img.split('/')[-1]
            if not img_name:
                # A URL ending in '/' gives no usable file name.
                continue
            img_resp = _fetch(img)
            if img_resp is None:
                continue
            img_data = img_resp.content
            print(img_name)
            # 4. Save the data; the context manager closes the file handle.
            with open(os.path.join(IMG_DIR, img_name), mode='wb') as img_file:
                img_file.write(img_data)