py之秀人网详情链接

发布时间: 2023-12-17 18:03:17 作者: 萧海~

在这里插入图片描述

import requests
from lxml import etree
# Cookies sent with the request. They are handed to requests through the
# separate ``cookies=`` argument instead of a hand-written ``cookie`` header
# (original note: Requests sorts cookies= alphabetically).
# NOTE(review): the values look like Unix timestamps captured from a browser
# session -- confirm whether the site actually requires them.
cookies = {
    'Hm_lvt_1e6428f355435b22644f2fc429cf38a4': '1702806796',
    'Hm_lpvt_1e6428f355435b22644f2fc429cf38a4': '1702806850',
}

# Content negotiation: accepted media types and preferred language.
_ACCEPT_HEADERS = {
    'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7',
    'accept-language': 'zh-CN,zh;q=0.9',
}

# Ask for an uncached copy of the page.
_NO_CACHE_HEADERS = {
    'cache-control': 'no-cache',
    'pragma': 'no-cache',
}

# Browser client-hint headers.
_CLIENT_HINT_HEADERS = {
    'sec-ch-ua': '"Not_A Brand";v="8", "Chromium";v="120", "Google Chrome";v="120"',
    'sec-ch-ua-mobile': '?0',
    'sec-ch-ua-platform': '"Windows"',
}

# Fetch-metadata headers describing a same-origin document navigation.
_FETCH_METADATA_HEADERS = {
    'sec-fetch-dest': 'document',
    'sec-fetch-mode': 'navigate',
    'sec-fetch-site': 'same-origin',
    'sec-fetch-user': '?1',
}

_USER_AGENT = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36'

# Full header set for the request. The groups are merged in the same key
# order as the original single literal so the resulting mapping is identical.
headers = {
    'authority': 'www.zps.im',
    **_ACCEPT_HEADERS,
    **_NO_CACHE_HEADERS,
    'referer': 'https://www.zps.im/',
    **_CLIENT_HINT_HEADERS,
    **_FETCH_METADATA_HEADERS,
    'upgrade-insecure-requests': '1',
    'user-agent': _USER_AGENT,
}

# Fetch page 2 of the site's listing, sending the cookies and headers
# defined above.
response = requests.get(
    'https://www.zps.im/page/2/',
    cookies=cookies,
    headers=headers,
    # Without a timeout requests waits indefinitely on a stalled connection.
    timeout=10,
)
# Fail loudly on a 4xx/5xx response instead of parsing an error page and
# silently printing an empty list.
response.raise_for_status()

# Parse the returned HTML and collect the href of every link found at
# div[class="column col-12"] > ol > li > p > a.
html = etree.HTML(response.text)
res = html.xpath('//div[@class="column col-12"]/ol/li/p/a/@href')
print(res)