import os
from concurrent.futures import ProcessPoolExecutor, ThreadPoolExecutor

import requests
from bs4 import BeautifulSoup
# url = 'https://www.umei.cc/meinvtupian/meinvxiezhen/'
def _safe_filename(name):
    """Return *name* stripped, with characters unsafe in file names replaced by ``_``."""
    unsafe = str.maketrans({ch: "_" for ch in '\\/:*?"<>|\r\n\t'})
    return name.strip().translate(unsafe) or "untitled"


def down(url, cookies=None):
    """Download one image for every link found on a listing page.

    The listing page at *url* is fetched and every ``div.title a`` link is
    followed.  On each linked page the last ``div.big-pic a img`` element is
    located and the file its ``src`` points to is saved as
    ``img/<link text>.jpg``.

    Args:
        url: Address of the listing page to scan.
        cookies: Optional cookies forwarded to every request.  When omitted,
            a module-level ``cookies`` object is used if one exists,
            otherwise no cookies are sent.

    Raises:
        requests.RequestException: If the listing page itself cannot be
            fetched.  Failures on individual linked pages are printed and
            skipped so the remaining links are still processed.
    """
    headers = {
        'authority': 'www.umei.cc',
        'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7',
        'accept-language': 'zh-CN,zh;q=0.9',
        'cache-control': 'max-age=0',
        'referer': 'https://www.umei.cc/bizhitupian/',
        'sec-ch-ua': '"Chromium";v="122", "Not(A:Brand";v="24", "Google Chrome";v="122"',
        'sec-ch-ua-mobile': '?0',
        'sec-ch-ua-platform': '"Windows"',
        'sec-fetch-dest': 'document',
        'sec-fetch-mode': 'navigate',
        'sec-fetch-site': 'same-origin',
        'sec-fetch-user': '?1',
        'upgrade-insecure-requests': '1',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.6261.95 Safari/537.36',
    }
    if cookies is None:
        # The original body read a global ``cookies`` that this file never
        # defines (NameError).  Honour one if it exists, else send none.
        cookies = globals().get("cookies")

    # open() below fails if the target directory is missing.
    os.makedirs('img', exist_ok=True)

    response = requests.get(url, cookies=cookies, headers=headers, timeout=30)
    response.raise_for_status()
    response.encoding = "utf-8"
    listing = BeautifulSoup(response.text, 'lxml')

    for link in listing.select("div.title a"):
        href = link.get('href')
        if not href:
            continue
        # Drop a leading "/" so the joined URL does not contain "//".
        page_url = "https://www.umei.cc/" + href.split("=")[-1].lstrip("/")
        title = link.text
        print(page_url, title)
        try:
            page = requests.get(url=page_url, cookies=cookies, headers=headers, timeout=30)
            page.raise_for_status()
            page.encoding = "utf-8"
            images = BeautifulSoup(page.text, 'lxml').select("div.big-pic a img")
            image_url = images[-1].get('src') if images else None
            if not image_url:
                print(f"no image found on {page_url}")
                continue
            image = requests.get(url=image_url, cookies=cookies, headers=headers, timeout=30)
            # Without this an HTML error page would be written out as a .jpg.
            image.raise_for_status()
        except requests.RequestException as exc:
            print(f"failed to download {page_url}: {exc!r}")
            continue
        with open(f'img/{_safe_filename(title)}.jpg', 'wb') as fh:
            fh.write(image.content)
if __name__ == "__main__":
    # Fan the listing pages out over a pool of 10 worker threads; the work is
    # network-bound, so threads overlap the waiting time.
    with ThreadPoolExecutor(10) as t:
        submitted = {}
        for i in range(1, 217):
            url = f'https://www.umei.cc/meinvtupian/rentiyishu/index_{i}.htm'
            submitted[t.submit(down, url)] = url
        # An exception raised inside a worker is stored on its future and is
        # lost unless somebody asks for it, so report every failure here.
        for future, url in submitted.items():
            error = future.exception()
            if error is not None:
                print(f"{url} failed: {error!r}")
如何用多线程下载图片?需要调用 down 函数。
青龙摄影 2024-07-31 20:44
相关推荐
轮子飞了 · 15 分钟前
记一次 Spring AI Alibaba + 百炼的踩坑:结构化输出与联网搜索的冲突
专注VB编程开发20年 · 20 分钟前
VB.NET是唯一能直接打击 Python 的语言
梦想三三 · 25 分钟前
【NLP入门到实战】TF-IDF算法详解 + 红楼梦120回关键词提取
弹简特 · 26 分钟前
【零基础学Python】05-Python函数完全指南:从初阶定义到进阶参数,一篇打通核心难点
学地理的小胖砸 · 42 分钟前
【批量处理tiff文件生成jpg缩略图】
机汇五金_ · 1 小时前
通信设备防雨箱如何兼顾防护与散热?
糖果店的幽灵 · 1 小时前
LangChain 1.3 完全教程:从入门到精通-Part 7: Documents(文档处理)
Wonderful U · 1 小时前
基于Python爬虫+Django的轻量化天气预报系统:从数据抓取到可视化展示的完整实战
lqjun0827 · 1 小时前
PyTorch梯度计算
词元Max · 1 小时前
3.1 Agent开发需要懂多少数学?