流程

代码

+ python代码

# Scrape image data from 绝对领域 (https://www.jdlingyu.com/tuji); the loop below walks the site's /page/1 through /page/4 listing pages.

import os

import parsel
import requests
from bs4 import BeautifulSoup

# Crawl listing pages 1-4 of jdlingyu.com, follow every post link found on
# them, and save the images referenced by each post into OUTPUT_DIR.

REQUEST_TIMEOUT = 10  # seconds; without a timeout a request can block forever
OUTPUT_DIR = 'img'


def _fetch(session, url):
    """Return the response for ``url``, or ``None`` if the request failed.

    Connection errors, timeouts and HTTP error statuses are reported on
    stdout and swallowed, so one bad URL does not abort the whole crawl and
    an error page is never mistaken for real content.
    """
    try:
        response = session.get(url, timeout=REQUEST_TIMEOUT)
        response.raise_for_status()
    except requests.RequestException as exc:
        print(f'skipped {url}: {exc}')
        return None
    return response


def _save_image(session, img_url):
    """Download ``img_url`` into OUTPUT_DIR.

    The file is named after the last ``/``-separated segment of the URL.
    URLs that yield an empty name, and downloads that fail, are skipped.
    """
    img_name = img_url.split('/')[-1]
    if not img_name:
        # A URL ending in '/' has no usable file name to save under.
        print(f'skipped {img_url}: no file name in URL')
        return
    img_resp = _fetch(session, img_url)
    if img_resp is None:
        return
    print(img_name)
    # 4. Save the data; the context manager closes the file even on error.
    with open(os.path.join(OUTPUT_DIR, img_name), mode='wb') as img_file:
        img_file.write(img_resp.content)


# open() does not create missing directories, so make sure the target exists.
os.makedirs(OUTPUT_DIR, exist_ok=True)

# A single session reuses connections across the many requests made below.
with requests.Session() as session:
    # 1. Send the request for each listing page.
    for page in range(1, 5):
        url = f'https://www.jdlingyu.com/page/{page}'
        response = _fetch(session, url)
        if response is None:
            continue
        # 2. Get the data (raw HTML of the listing page).
        html_data = response.text
        # 3. Parse the data: collect the link to every post on the page.
        selector = parsel.Selector(html_data)
        detail_url_list = selector.css('.post-info h2 a::attr(href)').getall()
        for detail_url in detail_url_list:
            resp = _fetch(session, detail_url)
            if resp is None:
                continue
            selector2 = parsel.Selector(resp.text)
            # The image URL is taken from each <img>'s data-src attribute.
            img_list = selector2.css('.entry-content img::attr(data-src)').getall()
            for img in img_list:
                _save_image(session, img)