版本:未加入题库版本最后一版
This commit is contained in:
49
xiuren/xiuren_dl.py
Normal file
49
xiuren/xiuren_dl.py
Normal file
@@ -0,0 +1,49 @@
|
||||
import requests
|
||||
from lxml import etree
|
||||
import os
|
||||
|
||||
# 设置目标URL和请求头
|
||||
url = "https://www.xiurenwang.cc/bang?f=7"
|
||||
headers = {
|
||||
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36",
|
||||
"Referer": "https://www.xiurenwang.cc/"
|
||||
}
|
||||
|
||||
# 发送请求获取网页内容
|
||||
response = requests.get(url, headers=headers)
|
||||
response.encoding = "utf-8" # 确保正确解码
|
||||
|
||||
# 解析HTML
|
||||
html = etree.HTML(response.text)
|
||||
|
||||
# 提取图片链接和标题(假设最新图片在列表页面中)
|
||||
image_items = html.xpath('//div[@class="list"]/li/a[@class="img"]/@href')
|
||||
titles = html.xpath('//div[@class="tit"]/a/text()')
|
||||
|
||||
# 创建保存图片的文件夹
|
||||
save_dir = "./xiuren_images"
|
||||
if not os.path.exists(save_dir):
|
||||
os.makedirs(save_dir)
|
||||
|
||||
# 只获取最新的一个条目(假设第一个是最新的)
|
||||
if image_items:
|
||||
latest_url = "https://www.xiurenwang.cc" + image_items[0] # 拼接详情页URL
|
||||
latest_title = titles[0] if titles else "latest_image"
|
||||
|
||||
# 访问详情页获取图片
|
||||
detail_response = requests.get(latest_url, headers=headers)
|
||||
detail_html = etree.HTML(detail_response.text)
|
||||
image_urls = detail_html.xpath('//div[@id="image"]/a/@href')
|
||||
|
||||
# 下载图片
|
||||
for idx, img_url in enumerate(image_urls):
|
||||
img_response = requests.get(img_url, headers=headers)
|
||||
img_name = f"{latest_title}_{idx + 1}.jpg"
|
||||
img_path = os.path.join(save_dir, img_name.replace('/', '_')) # 避免文件名中的斜杠
|
||||
with open(img_path, "wb") as f:
|
||||
f.write(img_response.content)
|
||||
print(f"已下载: {img_path}")
|
||||
else:
|
||||
print("未找到图片链接,可能需要调整XPath或检查网站结构。")
|
||||
|
||||
print("最新图片下载完成!")
|
||||
Reference in New Issue
Block a user