109 lines
3.8 KiB
Python
109 lines
3.8 KiB
Python
import re
|
||
from typing import Tuple, Optional
|
||
|
||
import parse
|
||
|
||
|
||
class FormatParser:
    """Extract episode numbers from file names with a ``parse`` format string.

    The format string is handed to ``parse.parse``; the named field selected
    by ``key`` (``"ep"`` by default) must contain text such as ``01``,
    ``EP01`` or ``EP01-EP02``.
    """

    _key = ""
    # No longer used by this class: the episode pattern's capture groups give
    # the same result. Kept unchanged so external references keep working.
    _split_chars = r"\.|\s+|\(|\)|\[|]|-|\+|【|】|/|~|;|&|\||#|_|「|」|~"

    # Compiled once instead of on every call.
    _RANGE_RE = re.compile(r"\d{1,4}-\d{1,4}")
    _EPISODE_RE = re.compile(r"^(EP)?(\d{1,4})(-(EP)?(\d{1,4}))?$", re.IGNORECASE)

    def __init__(self, eformat: str, details: Optional[str] = None,
                 part: Optional[str] = None, offset: Optional[int] = None,
                 key: str = "ep"):
        """
        :param eformat: format string passed to ``parse.parse``
        :param details: episode specification. ``"N-M"`` is stored verbatim
            as an explicit episode range, ``"N,M"`` is stored as integer
            start/end bounds, and ``"N"`` is stored as a single episode.
        :param part: part label, returned unchanged by ``split_episode``
        :param offset: value added to every episode number that is returned
        :param key: name of the format field that holds the episode text
        """
        self._format = eformat
        self._start_ep = None
        self._end_ep = None
        self._part = part if part else None
        if details:
            if self._RANGE_RE.match(details):
                # Explicit "N-M" range: keep the raw text in both bounds so
                # split_episode() can recognise it and return it directly.
                self._start_ep = self._end_ep = details
            else:
                bounds = details.split(",")
                self._start_ep = int(bounds[0])
                if len(bounds) > 1:
                    # The end bound is never smaller than the start bound.
                    self._end_ep = max(self._start_ep, int(bounds[1]))
                else:
                    self._end_ep = self._start_ep
        self.__offset = int(offset) if offset else 0
        self._key = key

    @property
    def format(self):
        """The format string given to the constructor."""
        return self._format

    @property
    def start_ep(self):
        """Start bound: an int, the raw ``"N-M"`` string, or ``None``."""
        return self._start_ep

    @property
    def end_ep(self):
        """End bound: an int, the raw ``"N-M"`` string, or ``None``."""
        return self._end_ep

    @property
    def part(self):
        """The part label, or ``None`` when none was given."""
        return self._part

    @property
    def offset(self):
        """Integer added to every returned episode number (default 0)."""
        return self.__offset

    def _episode_bounds(self) -> Tuple[int, int]:
        """Return the configured bounds as integers.

        Must only be called when ``details`` was supplied. An explicit
        ``"N-M"`` string is split on ``-`` and converted to two ints.
        """
        if isinstance(self._start_ep, str):
            first, last = self._start_ep.split("-")
            return int(first), int(last)
        return self._start_ep, self._end_ep

    def match(self, file: str) -> bool:
        """Tell whether ``file`` fits the format and the configured bounds.

        Returns ``True`` when no format is configured. Otherwise the file
        must yield an episode number, and, if ``details`` was supplied, that
        number must lie within the bounds (inclusive).
        """
        if not self._format:
            return True
        episode, _ = self.__handle_single(file)
        # Compare against None so that episode number 0 still counts.
        if episode is None:
            return False
        if self._start_ep is None:
            return True
        # Bounds are converted to ints first: an explicit "N-M" range is
        # stored as a string, and str/int comparison raises TypeError.
        lower, upper = self._episode_bounds()
        return lower <= episode <= upper

    def split_episode(self, file_name: str) -> Tuple[Optional[int], Optional[int], Optional[str]]:
        """Return ``(start episode, end episode, part)`` for ``file_name``.

        When ``details`` names one episode or an explicit ``"N-M"`` range,
        that value is returned directly and ``file_name`` is not parsed.
        The end episode is ``None`` for a single episode. The offset is
        added to every episode number that is not ``None``.
        """
        # Explicitly specified episode(s): return them without parsing.
        if self._start_ep is not None and self._start_ep == self._end_ep:
            if isinstance(self._start_ep, str):
                first, last = self._episode_bounds()
                if first == last:
                    return first + self.__offset, None, self.part
                return first + self.__offset, last + self.__offset, self.part
            return self._start_ep + self.__offset, None, self.part
        if not self._format:
            return None, None, None
        start, end = self.__handle_single(file_name)
        if start is not None:
            start += self.__offset
        if end is not None:
            end += self.__offset
        return start, end, self.part

    def __handle_single(self, file: str) -> Tuple[Optional[int], Optional[int]]:
        """Parse one file name and return its ``(start, end)`` episodes.

        Returns ``(None, None)`` when no format is configured, when the file
        does not fit the format, when the key field is missing, or when the
        field text is not of the form ``[EP]N`` or ``[EP]N-[EP]M``. The end
        episode is ``None`` when the text holds a single number.
        """
        if not self._format:
            return None, None
        ret = parse.parse(self._format, file)
        if not ret or self._key not in ret:
            return None, None
        # str() lets a typed field such as "{ep:d}", which yields an int,
        # pass through the regex instead of raising TypeError.
        found = self._EPISODE_RE.match(str(ret[self._key]))
        if not found:
            return None, None
        # Groups 2 and 5 are the digit runs of the first and second episode.
        first, last = found.group(2), found.group(5)
        return int(first), (int(last) if last is not None else None)
|