添加链接
link之家
链接快照平台
  • 输入网页链接,自动生成快照
  • 标签化管理网页链接
# @File: dlmp4.py
# @Official account: Python Learning and Development
"""Download an HLS (m3u8) stream and assemble it into a single MP4 file.

Workflow: fetch the playlist, download every ``.ts`` segment it lists using a
thread pool (each download can resume a partial file), write an ffmpeg concat
list, and let ffmpeg copy the segments into one MP4.
"""
import os
import subprocess
from concurrent.futures.thread import ThreadPoolExecutor

import requests
from loguru import logger
from tqdm import tqdm

# Working directories live next to this script.
_temp = os.path.dirname(os.path.abspath(__file__))
m3u8_path = os.path.join(_temp, "m3u8")
ts_path = os.path.join(_temp, "ts_file")
mp4_path = os.path.join(_temp, "mp4_file")
for _directory in (m3u8_path, ts_path, mp4_path):
    os.makedirs(_directory, exist_ok=True)

session = requests.Session()
MAX_WORKERS = 50  # upper bound on concurrent download threads


def download_from_url(url, dst):
    """Download ``url`` to ``dst``, resuming a partially written file.

    Args:
        url: Address of the resource to fetch.
        dst: Local path the bytes are written to.

    Returns:
        The size in bytes reported by the server's ``content-length`` header.

    Raises:
        requests.HTTPError: If the server answers with an error status.
        KeyError: If the response carries no ``content-length`` header.
    """
    headers = {
        "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.111 Safari/537.36"}
    # Probe request: only the headers are needed, so the connection is closed
    # again without reading the body.
    with requests.get(url, headers=headers, stream=True) as probe:
        probe.raise_for_status()
        file_size = int(probe.headers['content-length'])

    # Bytes already on disk from an earlier, interrupted run.
    first_byte = os.path.getsize(dst) if os.path.exists(dst) else 0
    if first_byte >= file_size:
        logger.info(f"{dst}:下载完毕")
        return file_size

    logger.info(f"当前下载的是:{url}")
    # Open-ended range: everything from the first missing byte onwards. The
    # User-Agent is kept so both requests look the same to the server.
    range_headers = dict(headers, Range=f"bytes={first_byte}-")
    with requests.get(url, headers=range_headers, stream=True) as req:
        req.raise_for_status()
        if first_byte and req.status_code != 206:
            # The server ignored the Range header and is sending the whole
            # file; appending would corrupt it, so start over.
            first_byte = 0
        mode = "ab" if first_byte else "wb"
        with open(dst, mode) as f, tqdm(
                total=file_size, initial=first_byte,
                unit='B', unit_scale=True, desc=dst) as pbar:
            for chunk in req.iter_content(chunk_size=1024):
                if chunk:
                    f.write(chunk)
                    # The final chunk is usually shorter than 1024 bytes.
                    pbar.update(len(chunk))
    return file_size


def get_ts_file(ts_item):
    """Download one segment described by a ``(url, file name)`` pair."""
    url, name = ts_item
    download_from_url(url, os.path.join(ts_path, name))


def read_file(prefix_url, file_path, file_name):
    """Yield ``(segment url, local file name)`` for each ``.ts`` playlist entry.

    Args:
        prefix_url: Base URL that the playlist entries are appended to.
        file_path: Path of the downloaded m3u8 playlist.
        file_name: Prefix put in front of every local segment file name.
    """
    with open(file_path, "r", encoding="utf-8") as fs:
        for line in fs:
            entry = line.strip()
            if entry.endswith(".ts"):
                yield f"{prefix_url}/{entry}", f"{file_name}{entry}"


def get_m3u8(download_url, file_path):
    """Fetch the playlist at ``download_url`` and save it to ``file_path``.

    Raises:
        requests.HTTPError: If the server answers with an error status, so
            that an error page is never stored as a playlist.
    """
    req = session.get(download_url)
    req.raise_for_status()
    with open(file_path, "wb") as fs:
        fs.write(req.content)


def merge_ts_file(file_name):
    """Write the ffmpeg concat list for the segments of ``file_name``.

    Only files named ``{file_name}index<number>.ts`` are listed, ordered by
    their numeric index, so segments of other videos in the shared directory
    are ignored.

    Returns:
        Path of the generated ``{file_name}_merge_file.txt``.
    """
    prefix = f"{file_name}index"
    suffix = ".ts"
    segments = []
    for name in os.listdir(ts_path):
        if not (name.startswith(prefix) and name.endswith(suffix)):
            continue
        index = name[len(prefix):-len(suffix)]
        if index.isdecimal():
            # Keep the real file name so zero-padded indices still resolve.
            segments.append((int(index), name))
    segments.sort()

    merge_text_path = os.path.join(ts_path, f"{file_name}_merge_file.txt")
    with open(merge_text_path, "w+") as f:
        # One "file <name>" line per segment, no trailing newline.
        f.write("\n".join(f"file {name}" for _, name in segments))
    return merge_text_path


def gen_mp4_file(file_name, text_path):
    """Concatenate the downloaded segments into ``{file_name}.mp4``.

    ffmpeg runs inside the segment directory because the concat list uses
    relative file names. The segments and the concat list are deleted only
    after ffmpeg has succeeded.

    Args:
        file_name: Video name; also the prefix of its segment files.
        text_path: Path of the concat list produced by ``merge_ts_file``.

    Raises:
        ValueError: If ffmpeg cannot be started or exits with an error.
    """
    mp4_file_name = f"{file_name}.mp4"
    mp4_full_path = os.path.join(mp4_path, mp4_file_name)
    # Argument list instead of a shell string: no quoting problems, and the
    # checked exit status is ffmpeg's own.
    command = ["ffmpeg", "-f", "concat", "-i", text_path,
               "-c", "copy", mp4_full_path]
    try:
        completed = subprocess.run(
            command, check=True, cwd=ts_path, stdout=subprocess.PIPE)
    except (subprocess.CalledProcessError, OSError) as exc:
        raise ValueError(f"{mp4_file_name},转换失败") from exc
    logger.info(completed.stdout.decode("utf-8", errors="replace"))

    # Clean up the intermediate files belonging to this video.
    prefix = f"{file_name}index"
    for name in os.listdir(ts_path):
        if name.startswith(prefix) and name.endswith(".ts"):
            os.remove(os.path.join(ts_path, name))
    if os.path.exists(text_path):
        os.remove(text_path)


def main(input_url):
    """Download the stream behind the playlist ``input_url`` as one MP4."""
    prefix_url = os.path.dirname(input_url)
    file_name = prefix_url.split("/")[-1]
    m3u8_file_name = f'{file_name}.m3u8'
    m3u8_file_path = os.path.join(m3u8_path, m3u8_file_name)
    get_m3u8(input_url, m3u8_file_path)

    ts_item_gen = read_file(prefix_url, m3u8_file_path, file_name)
    with ThreadPoolExecutor(MAX_WORKERS) as excutor:
        # Consuming the iterator re-raises any exception from a worker
        # instead of silently continuing with missing segments.
        list(excutor.map(get_ts_file, ts_item_gen))
    logger.info("全部下载完成")

    logger.info("生成ts文件列表")
    merge_text_path = merge_ts_file(file_name)
    logger.info("生成mp4")
    gen_mp4_file(file_name, merge_text_path)


if __name__ == '__main__':
    url = "https://cdn.aliyun.xxx.com/videos/202010/15/5f8345c15cb7bd239883ef72/134aag/index.m3u8"
    main(url)