# @文件名 : dlmp4.py
# @公众号: Python学习开发
from concurrent.futures.thread import ThreadPoolExecutor
from tqdm import tqdm
import requests
import os
from loguru import logger
import subprocess
# Working directories are created next to this script:
#   m3u8/     downloaded playlist files
#   ts_file/  raw .ts segments and the ffmpeg concat list
#   mp4_file/ final merged output
_temp = os.path.dirname(os.path.abspath(__file__))
m3u8_path = os.path.join(_temp, "m3u8")
ts_path = os.path.join(_temp, "ts_file")
mp4_path = os.path.join(_temp, "mp4_file")
# exist_ok=True creates a directory only when it is missing, without the
# check-then-create race of a separate os.path.exists() test.
os.makedirs(m3u8_path, exist_ok=True)
os.makedirs(ts_path, exist_ok=True)
os.makedirs(mp4_path, exist_ok=True)
# Shared HTTP session; get_m3u8() uses it to fetch the playlist.
session = requests.Session()
# Size of the thread pool that main() uses to download segments in parallel.
MAX_WORKERS = 50
def download_from_url(url, dst):
    """Download ``url`` to ``dst``, resuming a partially downloaded file.

    A first request reads the ``Content-Length`` header to learn the total
    size. If ``dst`` already holds at least that many bytes nothing is
    downloaded; otherwise the remaining bytes are requested with an HTTP
    ``Range`` header and written to ``dst`` while a tqdm progress bar is
    updated.

    Args:
        url: Address of the file to download.
        dst: Local path the content is written to.

    Returns:
        The total size of the remote file in bytes, as reported by the server.

    Raises:
        requests.HTTPError: If either request returns an error status.
        KeyError: If the server does not send a ``Content-Length`` header.
    """
    headers = {
        "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.111 Safari/537.36"}
    # Probe request: only the headers are needed, so the streamed response is
    # closed immediately instead of leaving the connection open.
    with requests.get(url, headers=headers, stream=True) as response:
        response.raise_for_status()
        file_size = int(response.headers['content-length'])
    # Bytes already on disk from a previous, interrupted run.
    first_byte = os.path.getsize(dst) if os.path.exists(dst) else 0
    if first_byte >= file_size:
        logger.info(f"{dst}:下载完毕")
        return file_size
    logger.info(f"当前下载的是:{url}")
    # Keep the User-Agent on the ranged request as well; the open-ended range
    # asks for everything from first_byte to the end of the file.
    range_headers = dict(headers, Range=f"bytes={first_byte}-")
    with requests.get(url, headers=range_headers, stream=True) as req:
        req.raise_for_status()
        # 206 means the server honoured the range. Any other success status
        # carries the whole file, so the partial file must be overwritten
        # rather than appended to.
        resumed = req.status_code == 206
        mode = 'ab' if resumed else 'wb'
        already_done = first_byte if resumed else 0
        with open(dst, mode) as f, tqdm(
                total=file_size, initial=already_done,
                unit='B', unit_scale=True, desc=dst) as pbar:
            for chunk in req.iter_content(chunk_size=1024):
                if chunk:
                    f.write(chunk)
                    # Chunks may be shorter than chunk_size; count real bytes.
                    pbar.update(len(chunk))
    return file_size
def get_ts_file(ts_item):
    """Download one segment into the segment directory.

    Args:
        ts_item: Indexable pair whose element 0 is the segment URL and whose
            element 1 is the local file name to store it under.
    """
    # Worker function for the thread pool: one call per playlist entry.
    download_from_url(ts_item[0], os.path.join(ts_path, ts_item[1]))
def read_file(prefix_url, file_path, file_name):
    """Yield a ``(url, local_name)`` pair for every segment in a playlist.

    Each line of the playlist at ``file_path`` is stripped of surrounding
    whitespace; lines ending in ``.ts`` are treated as segment entries and
    all other lines (tags, comments, blanks) are skipped.

    Args:
        prefix_url: URL prefix that segment names are appended to, separated
            by ``/``.
        file_path: Path of the local playlist file.
        file_name: Prefix prepended to each segment name to form the local
            file name.

    Yields:
        Tuples ``(f"{prefix_url}/{segment}", f"{file_name}{segment}")``.
    """
    # Playlists are UTF-8 text; read them as such instead of relying on the
    # platform's locale encoding.
    with open(file_path, "r", encoding="utf-8") as fs:
        # Iterate lazily; strip() already removes the trailing newline.
        for line in fs:
            new_item = line.strip()
            if new_item.endswith(".ts"):
                yield f"{prefix_url}/{new_item}", f"{file_name}{new_item}"
def get_m3u8(download_url, file_path):
    """Fetch the playlist at ``download_url`` and save it to ``file_path``.

    Args:
        download_url: URL of the ``.m3u8`` playlist.
        file_path: Local path the raw response body is written to.

    Raises:
        requests.HTTPError: If the server answers with an error status, so
            that an error page is never stored as if it were a playlist.
    """
    req = session.get(download_url)
    req.raise_for_status()
    with open(file_path, "wb") as fs:
        fs.write(req.content)
def merge_ts_file(file_name):
    """Write the ffmpeg concat list for one video and return its path.

    Looks in ``ts_path`` for segment files named ``{file_name}index<N>.ts``,
    orders them by the numeric value of ``<N>``, and writes one
    ``file <segment name>`` line per segment (no trailing newline) to
    ``{file_name}_merge_file.txt`` in the same directory.

    Args:
        file_name: Prefix identifying the video whose segments are listed.

    Returns:
        Path of the generated list file.
    """
    prefix = f"{file_name}index"
    suffix = ".ts"
    segments = []
    for item in os.listdir(ts_path):
        # Only this video's segments: the directory is shared, and files
        # belonging to another download must not end up in the list.
        if not (item.startswith(prefix) and item.endswith(suffix)):
            continue
        number = item[len(prefix):-len(suffix)]
        if number.isdecimal():
            segments.append((int(number), item))
    # Numeric sort so that index10 comes after index9, not after index1.
    segments.sort()
    merge_text_path = os.path.join(ts_path, f"{file_name}_merge_file.txt")
    with open(merge_text_path, "w", encoding="utf-8") as f:
        # Write the names exactly as they exist on disk.
        f.write("\n".join(f"file {item}" for _, item in segments))
    return merge_text_path
def gen_mp4_file(file_name, text_path):
    """Merge the listed segments into ``{file_name}.mp4`` using ffmpeg.

    Runs ``ffmpeg -f concat -i <text_path> -c copy <output>`` with ``ts_path``
    as the working directory, logs ffmpeg's standard output, and, only after
    ffmpeg succeeded, deletes the files in ``ts_path`` whose names start with
    ``file_name`` and contain a dot after that prefix (the segments and the
    concat list).

    Args:
        file_name: Base name of the video; also the prefix of its segment
            files.
        text_path: Path of the concat list file passed to ffmpeg.

    Raises:
        ValueError: If ffmpeg cannot be started or exits with a non-zero
            status. The intermediate files are left in place in that case.
    """
    mp4_file_name = f"{file_name}.mp4"
    mp4_full_path = os.path.join(mp4_path, mp4_file_name)
    # An argument list with cwd= replaces the "cd ...; ffmpeg ...; rm ..."
    # shell string: paths need no quoting, and check=True now reflects
    # ffmpeg's own exit status instead of that of a trailing rm.
    command = ["ffmpeg", "-f", "concat", "-i", text_path,
               "-c", "copy", mp4_full_path]
    try:
        completed = subprocess.run(command, check=True, cwd=ts_path,
                                   stdout=subprocess.PIPE)
    except (subprocess.CalledProcessError, OSError) as err:
        raise ValueError(f"{mp4_file_name},转换失败") from err
    result = completed.stdout.decode("utf-8", errors="replace")
    logger.info(result)
    # Clean up only after a successful merge, so a failed run can be retried
    # without downloading everything again.
    for entry in os.listdir(ts_path):
        if entry.startswith(file_name) and "." in entry[len(file_name):]:
            entry_path = os.path.join(ts_path, entry)
            if os.path.isfile(entry_path):
                os.remove(entry_path)
def main(input_url):
    """Download the video described by an m3u8 playlist and build an mp4.

    Steps: save the playlist, download every listed segment in parallel,
    write the ffmpeg concat list, and merge the segments into one mp4 file.

    Args:
        input_url: URL of the ``.m3u8`` playlist. The URL up to its last
            ``/`` is used as the prefix for segment URLs, and the last path
            component of that prefix names the output files.

    Raises:
        Exception: Any error raised while downloading a segment is re-raised
            here before merging starts.
        ValueError: If the ffmpeg merge fails.
    """
    prefix_url = os.path.dirname(input_url)
    file_name = prefix_url.split("/")[-1]
    m3u8_file_name = f'{file_name}.m3u8'
    m3u8_file_path = os.path.join(m3u8_path, m3u8_file_name)
    # Use the parameter, not a module-level variable, so main() also works
    # when it is imported and called from elsewhere.
    get_m3u8(input_url, m3u8_file_path)
    ts_item_gen = read_file(prefix_url, m3u8_file_path, file_name)
    with ThreadPoolExecutor(MAX_WORKERS) as excutor:
        # map() is lazy about results: draining it re-raises the first worker
        # exception here instead of silently merging an incomplete download.
        list(excutor.map(get_ts_file, ts_item_gen))
    logger.info("全部下载完成")
    logger.info("生成ts文件列表")
    merge_text_path = merge_ts_file(file_name)
    logger.info("生成mp4")
    gen_mp4_file(file_name, merge_text_path)
# Script entry point: download and convert the playlist below when this file
# is executed directly.
if "__main__" == __name__:
    url = "https://cdn.aliyun.xxx.com/videos/202010/15/5f8345c15cb7bd239883ef72/134aag/index.m3u8"
    main(url)