Python3批量下载抖音视频

import json
import os
import re
import sys
import time
from contextlib import closing

import requests

requests.packages.urllib3.disable_warnings()

class Spider():
    """Interactive downloader for the videos published by one Douyin user.

    ``run`` prompts for a user ID, looks the user up through the search API,
    lists the user's posts and saves each video into a directory named after
    the user's nickname.
    """

    # Characters removed from file and directory names: path separators, the
    # punctuation Windows rejects in names, and ASCII control characters.
    _UNSAFE_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]')

    # Captures the playback address embedded in a video share page.
    _PLAY_ADDR_PATTERN = re.compile(r'playAddr: "(.+)",')

    # Upper bound on user-search requests. The lookup used to repeat the same
    # request until the first hit matched, which never ended for an unknown ID.
    _MAX_SEARCH_ATTEMPTS = 3

    def __init__(self):
        """Set the request headers and print the start-up banner."""
        # NOTE(review): 'br' advertises Brotli support; requests only decodes
        # Brotli bodies when a Brotli library is installed - confirm this is
        # intended for the JSON endpoints.
        self.headers = {
            'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8',
            'accept-encoding': 'gzip, deflate, br',
            'accept-language': 'zh-CN,zh;q=0.9',
            'cache-control': 'max-age=0',
            'upgrade-insecure-requests': '1',
            'user-agent': 'Mozilla/5.0 (Linux; U; Android 5.1.1; zh-cn; MI 4S Build/LMY47V) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/53.0.2785.146 Mobile Safari/537.36 XiaoMi/MiuiBrowser/9.1.3',
        }
        print('[INFO]:Douyin App Video downloader...')
        print('[Version]: V3.0')
        print('[Author]: Charles')

    # Public entry point.
    def run(self):
        """Prompt for a user ID and watermark choice, then download every video.

        Raises:
            ValueError: if no user with the entered ID is found, or a share
                page does not contain a playback address.
        """
        user_id = input('Enter the ID:')
        # Answering '0' keeps the watermark; any other answer asks for the
        # watermark-free stream.
        watermark = input('With watermark or not(0 or 1):') == '0'
        video_names, video_urls, nickname = self._parse_userID(user_id)
        # A nickname may contain characters that are illegal in a directory
        # name; fall back to the entered ID if nothing usable is left.
        folder = self._clean_filename(nickname) or user_id
        os.makedirs(folder, exist_ok=True)
        print('[INFO]:Number of Videos <%s>' % len(video_urls))
        for num, (name, url) in enumerate(zip(video_names, video_urls), start=1):
            print('[INFO]:Parsing <No.%d> <Url:%s>' % (num, url))
            target = os.path.join(folder, self._clean_filename(name))
            self._downloader(url, target, watermark)
            print('\n')
        print('[INFO]:All Done...')

    @staticmethod
    def _clean_filename(name):
        """Return ``name`` with characters that are unsafe in file names removed."""
        return Spider._UNSAFE_FILENAME_CHARS.sub('', name)

    # Video download.
    def _downloader(self, video_url, path, watermark):
        """Stream the video behind ``video_url`` into the file at ``path``.

        Args:
            video_url: share-page URL of the video.
            path: destination file path.
            watermark: True to keep the watermarked stream.

        A response with a status other than 200 is reported on stdout and no
        file is written.
        """
        download_url = self._get_download_url(video_url, watermark)
        with closing(requests.get(download_url, headers=self.headers, stream=True)) as response:
            # Check the status first: an error response may carry no usable
            # content-length at all.
            if response.status_code != 200:
                sys.stdout.write('[WARNING]: Download skipped, HTTP status %s\n' % response.status_code)
                return
            chunk_size = 1024
            # The header is absent for chunked responses; 0 means "unknown".
            content_size = int(response.headers.get('content-length', 0))
            sys.stdout.write('[File Size]: %0.2f MB\n' % (content_size / chunk_size / 1024))
            size = 0
            with open(path, 'wb') as f:
                for data in response.iter_content(chunk_size=chunk_size):
                    f.write(data)
                    size += len(data)
                    if content_size > 0:
                        sys.stdout.write('[Progress]: %0.2f%%' % float(size / content_size * 100) + '\r')
                    else:
                        # No total to compare against: show the amount received.
                        sys.stdout.write('[Progress]: %0.2f MB' % (size / chunk_size / 1024) + '\r')
                    sys.stdout.flush()

    # Resolve the video download address.
    def _get_download_url(self, video_url, watermark):
        """Fetch the share page at ``video_url`` and return its playback URL.

        Raises:
            ValueError: if the page does not contain a playback address.
        """
        res = requests.get(url=video_url)
        return self._extract_play_addr(res.text, watermark)

    @staticmethod
    def _extract_play_addr(page_text, watermark):
        """Return the playback URL found in ``page_text``.

        When ``watermark`` is false every 'playwm' in the URL is replaced by
        'play'.

        Raises:
            ValueError: if ``page_text`` holds no ``playAddr`` entry.
        """
        match = Spider._PLAY_ADDR_PATTERN.search(page_text)
        if match is None:
            raise ValueError('[ERROR]:No playAddr found in the share page')
        url = match.group(1)
        return url if watermark else url.replace('playwm', 'play')

    @staticmethod
    def _find_user(user_list, user_id):
        """Return the ``user_info`` dict whose ``unique_id`` equals ``user_id``.

        Every search hit is inspected, not only the first one. Returns None
        when ``user_list`` is empty, None, or contains no matching entry.
        """
        for entry in user_list or []:
            info = entry.get('user_info') or {}
            if info.get('unique_id') == user_id:
                return info
        return None

    # Collect every video published by the user identified by user_id.
    def _parse_userID(self, user_id):
        """Look up ``user_id`` and list the user's published videos.

        Returns:
            A ``(video_names, video_urls, nickname)`` tuple; the two lists are
            index-aligned and every name ends in '.mp4'.

        Raises:
            ValueError: if the search never returns a user whose unique_id
                equals ``user_id``.
        """
        search_url = (
            'https://api.amemv.com/aweme/v1/discover/search/?cursor=0&keyword=%s&count=10&type=1'
            '&retry_type=no_retry&iid=17900846586&device_id=34692364855&ac=wifi&channel=xiaomi'
            '&aid=1128&app_name=aweme&version_code=162&version_name=1.6.2&device_platform=android'
            '&ssmix=a&device_type=MI+5&device_brand=Xiaomi&os_api=24&os_version=7.0'
            '&uuid=861945034132187&openudid=dc451556fc0eeadb&manifest_version_code=162'
            '&resolution=1080*1920&dpi=480&update_version_code=1622'
        ) % user_id
        user_info = None
        # Bounded retry instead of looping until a match appears.
        for _ in range(self._MAX_SEARCH_ATTEMPTS):
            res = requests.get(url=search_url, headers=self.headers)
            user_info = self._find_user(json.loads(res.text).get('user_list'), user_id)
            if user_info is not None:
                break
        if user_info is None:
            raise ValueError('[ERROR]:No user with ID <%s> was found' % user_id)

        user_url = 'https://www.amemv.com/aweme/v1/aweme/post/?user_id={}&max_cursor=0&count={}'.format(
            user_info['uid'], user_info['aweme_count'])
        res = requests.get(url=user_url, headers=self.headers)
        res_dic = json.loads(res.text)

        video_names = []
        video_urls = []
        unnamed = 1
        for each in res_dic['aweme_list']:
            share_info = each['share_info']
            share_desc = share_info['share_desc']
            # These two descriptions are treated as "no title": such videos
            # get a running number instead of the description as file name.
            if share_desc in ['抖音-原创音乐短视频社区', 'TikTok']:
                video_names.append(str(unnamed) + '.mp4')
                unnamed += 1
            else:
                video_names.append(share_desc + '.mp4')
            video_urls.append(share_info['share_url'])
        return video_names, video_urls, user_info['nickname']

if __name__ == '__main__':
    # Start the interactive downloader only when executed as a script.
    sp = Spider()
    sp.run()

相关推荐
你怎么知道我是队长12 分钟前
C语言---枚举变量
c语言·开发语言
李慕婉学姐16 分钟前
【开题答辩过程】以《基于JAVA的校园即时配送系统的设计与实现》为例,不知道这个选题怎么做的,不知道这个选题怎么开题答辩的可以进来看看
java·开发语言·数据库
吃茄子的猫18 分钟前
quecpython中&的具体含义和使用场景
开发语言·python
じ☆冷颜〃29 分钟前
黎曼几何驱动的算法与系统设计:理论、实践与跨领域应用
笔记·python·深度学习·网络协议·算法·机器学习
云栖梦泽32 分钟前
易语言中小微企业Windows桌面端IoT监控与控制
开发语言
数据大魔方42 分钟前
【期货量化实战】日内动量策略:顺势而为的短线交易法(Python源码)
开发语言·数据库·python·mysql·算法·github·程序员创富
APIshop1 小时前
Python 爬虫获取 item_get_web —— 淘宝商品 SKU、详情图、券后价全流程解析
前端·爬虫·python
风送雨1 小时前
FastMCP 2.0 服务端开发教学文档(下)
服务器·前端·网络·人工智能·python·ai
效率客栈老秦1 小时前
Python Trae提示词开发实战(8):数据采集与清洗一体化方案让效率提升10倍
人工智能·python·ai·提示词·trae
哈里谢顿1 小时前
一条 Python 语句在 C 扩展里到底怎么跑
python