podcast-search / src /config.py
terapyon's picture
srtの分割を1分にし、configなどを整え、READMEを書いた
d788666
raw
history blame
467 Bytes
from datetime import timedelta
import re
from pathlib import Path
# import logging
# Absolute directory that contains this module; every other location below
# is derived from it, so the constants do not depend on the working directory.
HERE = Path(__file__).resolve().parents[0]

# Sibling directories located one level above HERE.
STORE_DIR = HERE.parent.joinpath("store")
DATA_DIR = HERE.parent.joinpath("data")

# DuckDB database file, kept as a Path object.
DUCKDB_FILE = HERE.parent.joinpath("db", "terapyon-podcast.duckdb")

# Parquet locations inside STORE_DIR, exposed as plain strings (not Paths).
PODCAST_TITLE_LIST = str(STORE_DIR.joinpath("title-list-202301-202501.parquet"))
# NOTE(review): the "*" is kept literally in the string; presumably the
# consumer expands it as a glob over per-episode files -- confirm at call site.
EPISODES_PARQUET = str(STORE_DIR.joinpath("podcast-*.parquet"))
# Matches a run of digits that is delimited on both sides by "_" or "-";
# the digits themselves are captured as group 1.
# NOTE(review): judging by the name this is applied to SRT file names,
# presumably to extract an episode number -- confirm against callers.
RE_PODCAST_SRT_FILE = re.compile(r"[_-](\d+)[_-]")

# One-minute duration (60 seconds).
# NOTE(review): presumably the window length used when splitting SRT
# transcripts into chunks -- confirm against the code that consumes it.
divider_time = timedelta(seconds=60)