| import json
|
| import locale
|
| import os
|
| import random
|
| import re
|
| import string
|
| import threading
|
| import urllib3
|
| from typing import Any, List
|
| from uuid import uuid4
|
| from pathlib import Path
|
|
|
| from loguru import logger
|
|
|
| from app.models import const
|
|
|
| urllib3.disable_warnings()
|
|
|
|
|
| def get_uuid(remove_hyphen: bool = False):
|
| u = str(uuid4())
|
| if remove_hyphen:
|
| u = u.replace("-", "")
|
| return u
|
|
|
|
|
| def get_root_dir():
|
| return os.path.dirname(os.path.dirname(os.path.dirname(os.path.realpath(__file__))))
|
|
|
|
|
| def resource_dir(sub_dir: str = ""):
|
| d = os.path.join(get_root_dir(), "resource")
|
| if sub_dir:
|
| d = os.path.join(d, sub_dir)
|
| return d
|
|
|
| def task_dir(sub_dir: str = "") -> str:
|
| """获取任务目录路径
|
| Args:
|
| sub_dir (str, optional): 子目录名. Defaults to "".
|
| Returns:
|
| str: 任务目录的绝对路径
|
| """
|
|
|
| root_dir = get_root_dir()
|
|
|
| d = os.path.join(root_dir, "tasks")
|
| if sub_dir:
|
| d = os.path.join(d, sub_dir)
|
|
|
|
|
| os.makedirs(d, exist_ok=True)
|
|
|
| return d
|
|
|
|
|
| def font_dir(sub_dir: str = ""):
|
| d = resource_dir("fonts")
|
| if sub_dir:
|
| d = os.path.join(d, sub_dir)
|
| if not os.path.exists(d):
|
| os.makedirs(d)
|
| return d
|
|
|
|
|
| def song_dir(sub_dir: str = ""):
|
| d = resource_dir("songs")
|
| if sub_dir:
|
| d = os.path.join(d, sub_dir)
|
| if not os.path.exists(d):
|
| os.makedirs(d)
|
| return d
|
|
|
|
|
| def public_dir(sub_dir: str = ""):
|
| d = resource_dir("public")
|
| if sub_dir:
|
| d = os.path.join(d, sub_dir)
|
| if not os.path.exists(d):
|
| os.makedirs(d)
|
| return d
|
|
|
|
|
| def run_in_background(func, *args, **kwargs):
|
| def run():
|
| try:
|
| func(*args, **kwargs)
|
| except Exception as e:
|
| logger.error(f"run_in_background error: {e}")
|
|
|
| thread = threading.Thread(target=run)
|
| thread.start()
|
| return thread
|
|
|
|
|
| def time_convert_seconds_to_hmsm(seconds) -> str:
|
| hours = int(seconds // 3600)
|
| seconds = seconds % 3600
|
| minutes = int(seconds // 60)
|
| milliseconds = int(seconds * 1000) % 1000
|
| seconds = int(seconds % 60)
|
| return "{:02d}:{:02d}:{:02d},{:03d}".format(hours, minutes, seconds, milliseconds)
|
|
|
|
|
| def text_to_srt(idx: int, msg: str, start_time: float, end_time: float) -> str:
|
| start_time = time_convert_seconds_to_hmsm(start_time)
|
| end_time = time_convert_seconds_to_hmsm(end_time)
|
| srt = """%d
|
| %s --> %s
|
| %s
|
| """ % (
|
| idx,
|
| start_time,
|
| end_time,
|
| msg,
|
| )
|
| return srt
|
|
|
|
|
| def str_contains_punctuation(word):
|
| for p in const.PUNCTUATIONS:
|
| if p in word:
|
| return True
|
| return False
|
|
|
|
|
| def split_string_by_punctuations(s):
|
| result = []
|
| txt = ""
|
|
|
| previous_char = ""
|
| next_char = ""
|
| for i in range(len(s)):
|
| char = s[i]
|
| if char == "\n":
|
| result.append(txt.strip())
|
| txt = ""
|
| continue
|
|
|
| if i > 0:
|
| previous_char = s[i - 1]
|
| if i < len(s) - 1:
|
| next_char = s[i + 1]
|
|
|
| if char == "." and previous_char.isdigit() and next_char.isdigit():
|
|
|
| txt += char
|
| continue
|
|
|
| if char not in const.PUNCTUATIONS:
|
| txt += char
|
| else:
|
| result.append(txt.strip())
|
| txt = ""
|
| result.append(txt.strip())
|
|
|
| result = list(filter(None, result))
|
| return result
|
|
|
|
|
| def split_string_by_punctuations_new(text: str) -> List[str]:
|
| """按标点符号分割文本"""
|
| result = []
|
| txt = ""
|
|
|
| previous_char = ""
|
| next_char = ""
|
| for i in range(len(text)):
|
| char = text[i]
|
| if char == "\n":
|
| if txt.strip():
|
| result.append(txt.strip())
|
| txt = ""
|
| continue
|
|
|
| if i > 0:
|
| previous_char = text[i - 1]
|
| if i < len(text) - 1:
|
| next_char = text[i + 1]
|
|
|
| if char == "." and previous_char.isdigit() and next_char.isdigit():
|
| txt += char
|
| continue
|
|
|
| if char not in [".", "。", "!", "?", "...", "…"]:
|
| txt += char
|
| else:
|
| txt += char
|
| if txt.strip():
|
| result.append(txt.strip())
|
| txt = ""
|
|
|
| if txt.strip():
|
| result.append(txt.strip())
|
| return result
|
|
|
|
|
| def random_str(length: int = 8) -> str:
|
| """生成随机字符串"""
|
| letters = string.ascii_lowercase + string.digits
|
| return ''.join(random.choice(letters) for _ in range(length))
|
|
|
|
|
| def md5(text):
|
| import hashlib
|
|
|
| return hashlib.md5(text.encode("utf-8")).hexdigest()
|
|
|
|
|
| def get_system_locale():
|
| try:
|
| loc = locale.getdefaultlocale()
|
|
|
|
|
| language_code = loc[0].split("_")[0]
|
| return language_code
|
| except Exception:
|
| return "en"
|
|
|
|
|
| def load_locales(i18n_dir):
|
| _locales = {}
|
| for root, dirs, files in os.walk(i18n_dir):
|
| for file in files:
|
| if file.endswith(".json"):
|
| lang = file.split(".")[0]
|
| with open(os.path.join(root, file), "r", encoding="utf-8") as f:
|
| _locales[lang] = json.loads(f.read())
|
| return _locales
|
|
|
|
|
| def parse_extension(filename):
|
| return os.path.splitext(filename)[1].strip().lower().replace(".", "")
|
|
|
| def extract_id(video_file: str) -> str:
|
| """
|
| 从路径中提取 ID(tasks 目录下的第一级子目录名)
|
| 兼容 Windows 和 Linux
|
| """
|
| path = Path(video_file)
|
|
|
|
|
| try:
|
| parts = path.parts
|
| index = parts.index("tasks")
|
| return parts[index + 1]
|
| except (ValueError, IndexError):
|
| raise ValueError(f"Invalid path format: {video_file}")
|
|
|