Python 代码优化:解析视频文件信息
以下是对代码的优化:
- 使用列表推导式简化获取视频文件列表的过程:
video_files = [os.path.join(root, file) for root, dirs, files in os.walk(video_folder)
for file in files if any(file.endswith(format) for format in supported_formats)]
- 使用 f-strings 替换字符串拼接:
size_str = f'{size / 1024 / 1024:.2f} MiB' if size >= 1024 * 1024 else f'{size / 1024:.2f} KiB' if size >= 1024 else f'{size} B'
- 使用命名元组代替列表存储视频和音频信息:
from collections import namedtuple
VideoInfo = namedtuple('VideoInfo', ['format', 'resolution', 'bitrate', 'framerate', 'duration'])
AudioInfo = namedtuple('AudioInfo', ['bitrate', 'sampling_rate', 'language'])
video_output = VideoInfo(*subprocess.run(['mediainfo', '--Inform=Video;%Format%|%Width%x%Height%|%BitRate/String%|%FrameRate%|%Duration/String3%', video_file], stdout=subprocess.PIPE).stdout.decode().strip().split('|')
)
audio_output = [AudioInfo(*audio_info[i*3:i*3+3]) for i in range(len(audio_info)//3)]
- 使用 try-except 捕获解析帧率时可能出现的 ValueError 异常:
try:
framerate = float(video_info[3])
except ValueError:
framerate = None
- 将码率数据中的空格替换为 '' 而不是使用正则表达式:
bitrate = video_info[2].replace(' ', '')
完整代码如下:
import os
import subprocess
import math
from collections import namedtuple
# 视频格式
supported_formats = ['.mp4', '.avi', '.mkv', '.wmv', '.mov', '.flv', '.m2ts', '.ts', '.rm', '.rmvb',
'.vob', '.3gp', '.webm', '.hdmov', '.mp4v', '.mpv4', '.divx', '.xvid', '.f4v',
'.mpeg', '.asf', '.asx', '.m2t']
# 视频文件夹
video_folder = '/home/115/up'
# 获取视频文件列表(包括子目录)
video_files = [os.path.join(root, file) for root, dirs, files in os.walk(video_folder)
for file in files if any(file.endswith(format) for format in supported_formats)]
VideoInfo = namedtuple('VideoInfo', ['format', 'resolution', 'bitrate', 'framerate', 'duration'])
AudioInfo = namedtuple('AudioInfo', ['bitrate', 'sampling_rate', 'language'])
# 遍历所有视频文件
for video_file in video_files:
# 获取文件名
file_name = os.path.basename(video_file)
# 获取文件大小并进行单位换算
size = os.path.getsize(video_file)
size_str = f'{size / 1024 / 1024:.2f} MiB' if size >= 1024 * 1024 else f'{size / 1024:.2f} KiB' if size >= 1024 else f'{size} B'
# 使用 mediainfo 获取视频信息 / 音频信息
video_output = VideoInfo(*subprocess.run(['mediainfo', '--Inform=Video;%Format%|%Width%x%Height%|%BitRate/String%|%FrameRate%|%Duration/String3%',
video_file], stdout=subprocess.PIPE).stdout.decode().strip().split('|')
)
audio_output = subprocess.run(['mediainfo', '--Inform=Audio;%BitRate/String%|%SamplingRate/String%|%Language/String%', video_file], stdout=subprocess.PIPE).stdout.decode().strip()
audio_info = audio_output.split('|')
audio_output = [AudioInfo(*audio_info[i*3:i*3+3]) for i in range(len(audio_info)//3)]
# 时长取整
duration = video_output.duration.split('.')[0]
h, m, s = duration.split(':')
duration = f'{h}:{m}:{str(s).zfill(2)}'
# 以分钟计算的时长 2
duration_minutes = int(h) * 60 + int(m) + math.ceil(float(s)) / 60
# 计算压缩比率
ratio = round(duration_minutes / size * 1000000000, 2)
# 获取帧率
try:
framerate = float(video_output.framerate)
except ValueError:
framerate = None
# 打印文件信息
print(f'{file_name}, {size_str}, {duration}, {video_output.resolution}, {video_output.bitrate.replace(' ', '')}, {framerate}, {' / '.join([audio.language for audio in audio_output])}, {ratio}')
这些优化可以使代码更加简洁、高效,并提高可读性。
原文地址: https://www.cveoy.top/t/topic/mHjI 著作权归作者所有。请勿转载和采集!