Files
tools/VideoCompress/main.py
2026-01-11 12:40:07 +08:00

627 lines
21 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

import subprocess
from pathlib import Path
import sys
import os
import logging
from datetime import datetime
from time import time
from rich.logging import RichHandler
from rich.progress import Progress
from pickle import dumps, loads
from typing import Optional, Callable, Literal, List, Any, TYPE_CHECKING
import atexit
import re
import get_frame
import json
try:
from pydantic import BaseModel, Field, field_validator, model_validator
HAS_PYDANTIC = True
class Config(BaseModel):
save_to: Literal["single", "multi"] = Field("single", description="保存到单文件夹或者每个子文件夹创建compress_dir")
crf: Optional[int] = Field(18, ge=0, le=51, description="CRF值范围0-51")
bitrate: Optional[str] = Field(None, description="比特率,格式如: 1000k, 2.5M, 1500B")
codec: str = Field("h264", description="ffmpeg的codec如果使用GPU需要对应设置")
hwaccel: Optional[Literal["amf", "qsv", "cuda"]] = Field(None, description="使用GPU加速")
extra: List[str] = Field([], description="插入到ffmpeg输出前的自定义参数")
ffmpeg: str = "ffmpeg"
ffprobe: str = "ffprobe"
manual: Optional[List[str]] = Field(None, description=r"手动设置ffmpeg命令ffmpeg -i {input} {manual} {output}")
video_ext: List[str] = Field([".mp4", ".mkv"], description="视频文件后缀,含.")
compress_dir_name: str = Field("compress", description="压缩文件夹名称")
resolution: Optional[str] = Field(None, description="统一到特定尺寸None为不使用缩放")
fps: int = Field(30, description="fps", ge=0)
test_video_resolution: str = "1920x1080"
test_video_fps: int = Field(30, ge=0)
test_video_input: str = "compress_video_test.mp4"
test_video_output: str = "compressed_video_test.mp4"
disable_hwaccel_when_fail: bool = Field(True, description="当运行失败时,禁用硬件加速")
@field_validator('bitrate')
@classmethod
def validate_bitrate(cls, v: Optional[str]) -> Optional[str]:
if v is None:
return v
pattern = r'^[\d\.]+[MkB]*$'
if not re.match(pattern, v):
raise ValueError('bitrate格式不正确应为数字+单位(M/k/B),如: 1000k, 2.5M')
return v
@field_validator('resolution')
@classmethod
def validate_resolution(cls, v: Optional[str]) -> Optional[str]:
if v is None:
return v
pattern = r'^((-1)|\d+):((-1)|\d+)$'
if not re.match(pattern, v):
raise ValueError('resolution格式不正确应为{数字/-1}:{数字/-1}')
return v
@field_validator("compress_dir_name")
@classmethod
def valid_path(cls, v: str) -> str:
if re.search(r'[\\/:*?"<>|\x00-\x1F]', v):
raise ValueError("某配置不符合目录名语法")
return v
@model_validator(mode='after')
def validate_mutual_exclusive(self):
crf_none = self.crf is None
bitrate_none = self.bitrate is None
# 有且只有一者为None
if crf_none == bitrate_none:
raise ValueError('crf和bitrate必须互斥有且只有一个为None')
return self
def dump(self):
return self.model_dump()
except ImportError:
HAS_PYDANTIC = False
from dataclasses import dataclass, asdict
import copy
@dataclass
class Config:
save_to: str = "single"
crf: Optional[int] = 18
bitrate: Optional[str] = None
codec: str = "h264"
hwaccel: Optional[str] = None
extra: List[str] = []
ffmpeg: str = "ffmpeg"
ffprobe: str = "ffprobe"
manual: Optional[List[str]] = None
video_ext: List[str] = [".mp4", ".mkv"]
compress_dir_name: str = "compress"
resolution: Optional[str] = None
fps: int = 30
test_video_resolution: str = "1920x1080"
test_video_fps: int = 30
test_video_input: str = "compress_video_test.mp4"
test_video_output: str = "compressed_video_test.mp4"
disable_hwaccel_when_fail: bool = True
def update(self, other):
if isinstance(other, dict):
d = other
elif isinstance(other, Config):
d = asdict(other)
else:
return
for k, v in d.items():
if hasattr(self, k):
setattr(self, k, v)
def copy(self):
return copy.deepcopy(self)
def dump(self):
return asdict(self)
root = None
if os.environ.get("INSTALL", "0") == "1":
CFG_FILE = Path(os.getenv("APPDATA", "C:/")) / "VideoCompress" / "config.json"
else:
CFG_FILE = Path(sys.path[0]) / "config.json"
if CFG_FILE.exists():
try:
import json
if HAS_PYDANTIC:
assert BaseModel # type: ignore
assert issubclass(Config, BaseModel)
CFG = Config.model_validate_json(CFG_FILE.read_text())
else:
assert Config
cfg:dict[str, Any] = json.loads(CFG_FILE.read_text())
CFG = Config(**cfg)
get_frame.ffprobe = CFG.ffprobe
logging.debug(CFG)
except KeyboardInterrupt as e:
raise e
except Exception as e:
logging.warning("Invalid config file, ignored.")
logging.debug(e)
else:
try:
if HAS_PYDANTIC:
if TYPE_CHECKING:
assert BaseModel # type: ignore
assert issubclass(Config, BaseModel)
CFG = Config() # type: ignore
CFG_FILE.write_text(CFG.model_dump_json(indent=4))
else:
import json
if TYPE_CHECKING:
assert Config
assert asdict # type: ignore
CFG = Config() # type: ignore
CFG_FILE.write_text(json.dumps(asdict(CFG), indent=4))
logging.info("Config file created.")
except Exception as e:
logging.warning("Failed to create config file.", exc_info=e)
def get_cmd(video_path: str | Path, output_file: str | Path) -> list[str]:
if isinstance(video_path, Path):
video_path = str(video_path.resolve())
if isinstance(output_file, Path):
output_file = str(output_file.resolve())
if CFG.manual is not None:
command = [CFG.ffmpeg, "-hide_banner", "-i", video_path]
command.extend(CFG.manual)
command.append(output_file)
return command
command = [
CFG.ffmpeg,
"-hide_banner",
]
if CFG.hwaccel is not None:
command.extend(
[
"-hwaccel",
CFG.hwaccel,
"-hwaccel_output_format",
CFG.hwaccel,
]
)
command.extend(
[
"-i",
video_path,
]
)
if CFG.bitrate is not None:
if CFG.resolution is not None:
command.extend(
[
"-vf",
f"scale={CFG.resolution}",
]
)
command.extend(
[
"-c:v",
CFG.codec,
"-b:v",
CFG.bitrate,
"-r",
str(CFG.fps),
"-y",
]
)
else:
if CFG.resolution is not None:
command.extend(
[
"-vf",
f"scale={CFG.resolution}",
]
)
command.extend(
[
"-c:v",
CFG.codec,
"-global_quality",
str(CFG.crf),
"-r",
str(CFG.fps),
"-y",
]
)
command.extend(CFG.extra)
command.append(output_file)
logging.debug(f"Create CMD: {command}")
return command
# 配置logging
def setup_logging():
log_dir = Path("logs")
log_dir.mkdir(exist_ok=True)
log_file = log_dir / f"video_compress_{datetime.now().strftime('%Y%m%d')}.log"
stream = RichHandler(rich_tracebacks=True, tracebacks_show_locals=True)
stream.setLevel(logging.INFO)
stream.setFormatter(logging.Formatter("%(message)s"))
file = logging.FileHandler(log_file, encoding="utf-8")
file.setLevel(logging.DEBUG)
logging.basicConfig(
level=logging.DEBUG,
format="%(asctime)s - %(levelname) 7s - %(message)s",
handlers=[file, stream],
)
def fmt_time(t: float | int) -> str:
if t > 3600:
return f"{t//3600}h {t//60}min {t%60}s"
elif t > 60:
return f"{t//60}min {t%60}s"
else:
return f"{round(t)}s"
def process_video(
video_path: Path,
compress_dir: Optional[Path] = None,
update_func: Optional[Callable[[Optional[int], Optional[str]], None]] = None,
):
if compress_dir is None:
# 在视频文件所在目录下创建 compress 子目录(如果不存在)
compress_dir = video_path.parent / CFG.compress_dir_name
else:
assert root
compress_dir /= video_path.parent.relative_to(root)
assert isinstance(compress_dir, Path)
compress_dir.mkdir(exist_ok=True, parents=True)
# 输出文件路径:与原文件同名,保存在 compress 目录下
output_file = compress_dir / (video_path.stem + video_path.suffix)
if output_file.is_file():
logging.warning(f"文件{output_file}存在,跳过")
return False
video_path_str = str(video_path.absolute())
command = get_cmd(video_path_str, output_file)
try:
result = subprocess.Popen(
command,
stdout=subprocess.PIPE,
stderr=subprocess.PIPE,
encoding="utf-8",
text=True,
)
total = ""
while result.poll() is None:
line = " "
while result.poll() is None and line[-1:] not in "\r\n":
assert result.stderr is not None
line += result.stderr.read(1)
total += line[-1]
# print(line[-1])
if "warning" in line.lower():
logging.warning(f"[FFmpeg]({video_path_str}): {line}")
elif "error" in line.lower():
logging.error(f"[FFmpeg]({video_path_str}): {line}")
elif "assertion" in line.lower():
logging.error(f"[FFmpeg]({video_path_str}): {line}")
elif "frame=" in line and update_func is not None:
# print(line,end="")
match = re.search(r"frame=\s*(\d+)", line)
frame_number = int(match.group(1)) if match else None
match = re.search(r"[\d\.]+x", line)
rate = match.group(0) if match else None
update_func(frame_number, rate)
if result.returncode != 0:
logging.error(
f"处理文件 {video_path_str} 失败"
)
logging.debug(f"返回码: {result.returncode}; cmd={' '.join(command)}")
output_file.unlink(missing_ok=True)
assert result.stdout is not None
logging.debug(result.stdout.read())
logging.debug(total)
if CFG.hwaccel == "mediacodec" and CFG.codec in [
"h264_mediacodec",
"hevc_mediacodec",
]:
logging.info(
"mediacodec硬件加速器已知在较短片段上存在异常将禁用加速重试。"
)
output_file.unlink(missing_ok=True)
bak = CFG.codec, CFG.hwaccel
CFG.hwaccel = None
CFG.codec = "h264" if CFG.codec == "h264_mediacodec" else "hevc"
assert not output_file.exists()
ret = process_video(video_path, compress_dir, update_func)
CFG.codec, CFG.hwaccel = bak
if not ret:
logging.error("重试仍然失败。")
return False
else:
return True
elif CFG.disable_hwaccel_when_fail and CFG.hwaccel is not None:
logging.info("正在禁用硬件加速器重试,进度条可能发生混乱。")
output_file.unlink(missing_ok=True)
if TYPE_CHECKING:
assert BaseModel # type: ignore
assert isinstance(CFG, BaseModel)
bak = CFG.codec, CFG.hwaccel
CFG.hwaccel = None
if (
CFG.codec.endswith("_mediacodec")
or CFG.codec.endswith("_qsv")
or CFG.codec.endswith("_nvenc")
or CFG.codec.endswith("_amf")
):
CFG.codec = CFG.codec.split("_")[0]
assert not output_file.exists()
ret = process_video(video_path, compress_dir, update_func)
CFG.codec, CFG.hwaccel = bak
if not ret:
logging.error("重试仍然失败。")
return False
else:
logging.debug(f"文件处理成功: {video_path_str} -> {output_file}")
except KeyboardInterrupt as e:
raise e
except Exception as e:
logging.error(
f"执行 ffmpeg 命令时发生异常, 文件:{str(video_path_str)}cmd={' '.join(map(str,command))}",
exc_info=e,
)
return False
return True
def traverse_directory(root_dir: Path):
video_extensions = set(CFG.video_ext)
sm = None
# 获取视频文件列表和帧数信息
video_files:list[Path] = []
que = list(root_dir.glob("*"))
while que:
d = que.pop()
for file in d.glob("*") if d.is_dir() else [d]:
if (
file.parent.name == CFG.compress_dir_name
or file.name == CFG.compress_dir_name
):
continue
if file.is_file() and file.suffix.lower() in video_extensions:
video_files.append(file)
elif file.is_dir():
que.append(file)
if not video_files:
logging.warning("未找到需要处理的视频文件")
return
# 获取视频信息
frames: dict[Path, float] = {}
cached_data: dict[Path, float] = {}
info_file = Path("video_info.cache")
if info_file.is_file():
try:
cached_data = loads(info_file.read_bytes())
if isinstance(cached_data, dict):
logging.debug("Loaded video info from cache.")
else:
cached_data = {}
except Exception as e:
logging.debug("Failed to load video info cache.", exc_info=e)
with Progress() as prog:
task = prog.add_task("正在获取视频信息", total=len(video_files))
for file in video_files:
prog.advance(task)
if file in cached_data and cached_data[file] > 0:
frames[file] = cached_data[file]
continue
fr = get_frame.get_video_frame_count(str(file.resolve()))
if fr is None:
logging.debug(
f"无法获取视频信息: {file}, 时长为N/A默认使用0s"
)
frames[file] = 0 if fr is None else fr
if 0 in frames.values():
logging.warning(
f"视频{', '.join([f.name for f,frames in frames.items() if frames==0])}文件帧数信息获取失败。总进度估计将不准确。"
)
prog.remove_task(task)
try:
info_file.write_bytes(dumps(frames))
logging.debug("Saved video info to cache.")
except Exception as e:
logging.debug("Failed to save video info cache.", exc_info=e)
logging.debug(f"开始遍历目录: {root_dir}, 共{len(frames)}个视频文件")
# 创建进度条
with Progress() as prog:
total_frames = sum(frames.values())
main_task = prog.add_task(
"总进度", total=total_frames if total_frames > 0 else len(frames)
)
# 创建文件队列
for file in frames.keys():
# 进度跟踪
filename = file.relative_to(root_dir)
# 创建文件级进度条
if frames[file] == 0:
file_task = prog.add_task(f"{filename}")
else:
file_task = prog.add_task(f"{filename}", total=frames[file])
with prog._lock:
completed_start = prog._tasks[main_task].completed
def update_progress(x, rate):
if frames[file] == 0:
prog.update(
file_task,
description=f"{filename} 已处理{x}{f'速率{rate}' if rate else ''}",
)
else:
prog.update(
file_task,
completed=x,
description=f"{filename} {f'速率{rate}' if rate else ''}",
)
prog.update(main_task, completed=completed_start + x)
if CFG.save_to == "single":
process_video(
file, root_dir / CFG.compress_dir_name, update_progress
)
else:
process_video(file, None, update_progress)
# 移除文件级进度条
prog.update(main_task, completed=completed_start + frames[file])
prog.remove_task(file_task)
try:
info_file.unlink(missing_ok=True)
except Exception as e:
logging.warning("无法删除视频信息缓存文件", exc_info=e)
def test():
os.environ["PATH"] = (
Path(__file__).parent.as_posix() + os.pathsep + os.environ["PATH"]
)
try:
subprocess.run(
[CFG.ffmpeg, "-version"], stdout=-3, stderr=-3
).check_returncode()
except Exception as e:
print(__file__)
logging.critical("无法运行ffmpeg")
exit(-1)
try:
ret = subprocess.run(
f"{CFG.ffmpeg} -hide_banner -f lavfi -i testsrc=duration=1:size={CFG.test_video_resolution}:rate={CFG.test_video_fps} -c:v libx264 -y -pix_fmt yuv420p {CFG.test_video_input}".split(),
stdout=subprocess.PIPE,
stderr=subprocess.PIPE,
text=True,
)
if ret.returncode != 0:
logging.warning("无法生成测试视频.")
logging.debug(ret.stdout)
logging.debug(ret.stderr)
ret.check_returncode()
cmd = get_cmd(
CFG.test_video_input,
CFG.test_video_output,
)
ret = subprocess.run(
cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True
)
if ret.returncode != 0:
logging.error("测试视频压缩失败")
logging.debug(ret.stdout)
logging.debug(ret.stderr)
logging.error("Error termination via test failed.")
exit(-1)
if get_frame.get_video_frame_count("compress_video_test.mp4") is None:
logging.error("测试读取帧数失败,将无法正确显示进度。")
os.remove("compress_video_test.mp4")
os.remove("compressed_video_test.mp4")
except KeyboardInterrupt as e:
raise e
except Exception as e:
if os.path.exists("compress_video_test.mp4"):
os.remove("compress_video_test.mp4")
logging.warning("测试未通过,继续运行可能出现未定义行为。")
logging.debug("Test error", exc_info=e)
def exit_pause():
if os.name == "nt":
os.system("pause")
elif os.name == "posix":
os.system("read -p 'Press Enter to continue...'")
def main(_root=None):
atexit.register(exit_pause)
global root
setup_logging()
tot_bgn = time()
logging.info("-------------------------------")
logging.info(datetime.now().strftime("Video Compress started at %Y/%m/%d %H:%M"))
if _root is not None:
root = Path(_root)
else:
# 通过命令行参数传入需要遍历的目录
if len(sys.argv) < 2:
print(f"用法python {__file__} <目标目录>")
logging.warning("Error termination via invalid input.")
sys.exit(1)
root = Path(sys.argv[1])
if root.name.lower() == CFG.compress_dir_name.lower():
logging.critical("请修改目标目录名为非compress。")
logging.error("Error termination via invalid input.")
sys.exit(1)
logging.info("开始验证环境")
test()
if not root.is_dir():
print("提供的路径不是一个有效目录。")
logging.warning("Error termination via invalid input.")
sys.exit(1)
try:
traverse_directory(root)
tot_end = time()
logging.info(f"Elapsed time: {fmt_time(tot_end-tot_bgn)}")
logging.info("Normal termination of Video Compress.")
except KeyboardInterrupt:
logging.warning(
"Error termination via keyboard interrupt, CHECK IF LAST PROCSSING VIDEO IS COMPLETED."
)
except Exception as e:
logging.error(
"Error termination via unhandled error, CHECK IF LAST PROCSSING VIDEO IS COMPLETED.",
exc_info=e,
)
if __name__ == "__main__":
# sys.argv.append(r'C:\Users\flt\Documents\WeChat Files\wxid_m8h0igh8p52p22\FileStorage\Video')
main()