Files
subtitles-sync-whisper/core/subtitles.py

71 lines
2.5 KiB
Python

import os
import re
import shutil
from typing import List
from config import SYNC_CONFIG
from .types import SubtitleEntry
class SubtitleHandler:
@staticmethod
def parse_time(t):
h, m, s, ms = int(t[:2]), int(t[3:5]), int(t[6:8]), int(t[9:])
return h * 3600000 + m * 60000 + s * 1000 + ms
@staticmethod
def format_time(ms):
ms = max(0, ms)
h, r = divmod(ms, 3600000)
m, r = divmod(r, 60000)
s, ms = divmod(r, 1000)
return f"{h:02}:{m:02}:{s:02},{ms:03}"
@staticmethod
def parse_srt(filepath: str) -> List[SubtitleEntry]:
if not os.path.exists(filepath): return []
encodings = ['utf-8-sig', 'utf-8', 'latin-1']
content = ""
for enc in encodings:
try:
with open(filepath, 'r', encoding=enc) as f:
content = f.read()
break
except UnicodeDecodeError:
continue
entries = []
pattern = re.compile(r'(\d+)\n(\d{2}:\d{2}:\d{2},\d{3}) --> (\d{2}:\d{2}:\d{2},\d{3})\n((?:(?!\r?\n\r?\n).)*)',
re.DOTALL)
for match in pattern.finditer(content):
start = SubtitleHandler.parse_time(match.group(2))
end = SubtitleHandler.parse_time(match.group(3))
entries.append(SubtitleEntry(int(match.group(1)), start, end, match.group(4).strip()))
return entries
@staticmethod
def create_backup(filepath: str):
"""Creates a .bak copy of the subtitles if one doesn't exist."""
backup_path = filepath + ".bak"
if not os.path.exists(backup_path):
try:
shutil.copy2(filepath, backup_path)
print(f"Backup created: {os.path.basename(backup_path)}")
except IOError as e:
print(f"Warning: Could not create backup: {e}")
@staticmethod
def write_srt(filepath: str, entries: List[SubtitleEntry]):
# 1. Ensure backup exists before overwriting
if SYNC_CONFIG['create_backup']:
SubtitleHandler.create_backup(filepath)
# 2. Overwrite
try:
with open(filepath, 'w', encoding='utf-8') as f:
for entry in entries:
f.write(
f"{entry.index}\n{SubtitleHandler.format_time(entry.start_ms)} --> {SubtitleHandler.format_time(entry.end_ms)}\n{entry.raw_text}\n\n")
except IOError as e:
print(f"Error writing subtitle file: {e}")