feat:刮削模块支持覆盖

This commit is contained in:
jxxghp 2023-12-17 10:49:00 +08:00
parent cb12a052ac
commit cd7f688e78
5 changed files with 86 additions and 45 deletions

View File

@ -421,15 +421,19 @@ class ChainBase(metaclass=ABCMeta):
"""
return self.run_module("post_torrents_message", message=message, torrents=torrents)
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str) -> None:
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str,
force_nfo: bool = False, force_img: bool = False) -> None:
"""
刮削元数据
:param path: 媒体文件路径
:param mediainfo: 识别的媒体信息
:param transfer_type: 转移模式
:param force_nfo: 强制刮削nfo
:param force_img: 强制刮削图片
:return: 成功或失败
"""
self.run_module("scrape_metadata", path=path, mediainfo=mediainfo, transfer_type=transfer_type)
self.run_module("scrape_metadata", path=path, mediainfo=mediainfo,
transfer_type=transfer_type, force_nfo=force_nfo, force_img=force_img)
def register_commands(self, commands: Dict[str, dict]) -> None:
"""

View File

@ -588,12 +588,15 @@ class DoubanModule(_ModuleBase):
return []
return infos.get("subject_collection_items")
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str) -> None:
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str,
force_nfo: bool = False, force_img: bool = False) -> None:
"""
刮削元数据
:param path: 媒体文件路径
:param mediainfo: 识别的媒体信息
:param transfer_type: 传输类型
:param force_nfo: 是否强制刮削nfo
:param force_img: 是否强制刮削图片
:return: 成功或失败
"""
if settings.SCRAP_SOURCE != "douban":
@ -630,7 +633,9 @@ class DoubanModule(_ModuleBase):
self.scraper.gen_scraper_files(meta=meta,
mediainfo=mediainfo,
file_path=scrape_path,
transfer_type=transfer_type)
transfer_type=transfer_type,
force_nfo=force_nfo,
force_img=force_img)
else:
# 目录下的所有文件
for file in SystemUtils.list_files(path, settings.RMT_MEDIAEXT):
@ -667,7 +672,9 @@ class DoubanModule(_ModuleBase):
self.scraper.gen_scraper_files(meta=meta,
mediainfo=mediainfo,
file_path=file,
transfer_type=transfer_type)
transfer_type=transfer_type,
force_nfo=force_nfo,
force_img=force_img)
except Exception as e:
logger.error(f"刮削文件 {file} 失败,原因:{str(e)}")
logger.info(f"{path} 刮削完成")

View File

@ -14,53 +14,67 @@ from app.utils.system import SystemUtils
class DoubanScraper:
_transfer_type = settings.TRANSFER_TYPE
_force_nfo = False
_force_img = False
def gen_scraper_files(self, meta: MetaBase, mediainfo: MediaInfo,
file_path: Path, transfer_type: str):
file_path: Path, transfer_type: str,
force_nfo: bool = False, force_img: bool = False):
"""
生成刮削文件
:param meta: 元数据
:param mediainfo: 媒体信息
:param file_path: 文件路径或者目录路径
:param transfer_type: 传输类型
:param force_nfo: 强制生成NFO
:param force_img: 强制生成图片
"""
self._transfer_type = transfer_type
self._force_nfo = force_nfo
self._force_img = force_img
try:
# 电影
if mediainfo.type == MediaType.MOVIE:
# 强制或者不存在时才处理
if not file_path.with_name("movie.nfo").exists() \
and not file_path.with_suffix(".nfo").exists():
if self._force_nfo or (not file_path.with_name("movie.nfo").exists()
and not file_path.with_suffix(".nfo").exists()):
# 生成电影描述文件
self.__gen_movie_nfo_file(mediainfo=mediainfo,
file_path=file_path)
# 生成电影图片
self.__save_image(url=mediainfo.poster_path,
file_path=file_path.with_name(f"poster{Path(mediainfo.poster_path).suffix}"))
image_path = file_path.with_name(f"poster{Path(mediainfo.poster_path).suffix}")
if self._force_img or not image_path.exists():
self.__save_image(url=mediainfo.poster_path,
file_path=image_path)
# 背景图
if mediainfo.backdrop_path:
self.__save_image(url=mediainfo.backdrop_path,
file_path=file_path.with_name(f"backdrop{Path(mediainfo.backdrop_path).suffix}"))
image_path = file_path.with_name(f"backdrop{Path(mediainfo.backdrop_path).suffix}")
if self._force_img or not image_path.exists():
self.__save_image(url=mediainfo.backdrop_path,
file_path=image_path)
# 电视剧
else:
# 不存在时才处理
if not file_path.parent.with_name("tvshow.nfo").exists():
if self._force_nfo or not file_path.parent.with_name("tvshow.nfo").exists():
# 根目录描述文件
self.__gen_tv_nfo_file(mediainfo=mediainfo,
dir_path=file_path.parents[1])
# 生成根目录图片
self.__save_image(url=mediainfo.poster_path,
file_path=file_path.with_name(f"poster{Path(mediainfo.poster_path).suffix}"))
image_path = file_path.with_name(f"poster{Path(mediainfo.poster_path).suffix}")
if self._force_img or not image_path.exists():
self.__save_image(url=mediainfo.poster_path,
file_path=image_path)
# 背景图
if mediainfo.backdrop_path:
self.__save_image(url=mediainfo.backdrop_path,
file_path=file_path.with_name(f"backdrop{Path(mediainfo.backdrop_path).suffix}"))
image_path = file_path.with_name(f"backdrop{Path(mediainfo.backdrop_path).suffix}")
if self._force_img or not image_path.exists():
self.__save_image(url=mediainfo.backdrop_path,
file_path=image_path)
# 季目录NFO
if not file_path.with_name("season.nfo").exists():
if self._force_nfo or not file_path.with_name("season.nfo").exists():
self.__gen_tv_season_nfo_file(mediainfo=mediainfo,
season=meta.begin_season,
season_path=file_path.parent)
@ -175,8 +189,6 @@ class DoubanScraper:
"""
下载图片并保存
"""
if file_path.exists():
return
if not url:
return
try:
@ -201,8 +213,6 @@ class DoubanScraper:
"""
保存NFO
"""
if file_path.exists():
return
xml_str = doc.toprettyxml(indent=" ", encoding="utf-8")
if self._transfer_type in ['rclone_move', 'rclone_copy']:
self.__save_remove_file(file_path, xml_str)

View File

@ -212,12 +212,15 @@ class TheMovieDbModule(_ModuleBase):
return [MediaInfo(tmdb_info=info) for info in results]
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str) -> None:
def scrape_metadata(self, path: Path, mediainfo: MediaInfo, transfer_type: str,
force_nfo: bool = False, force_img: bool = False) -> None:
"""
刮削元数据
:param path: 媒体文件路径
:param mediainfo: 识别的媒体信息
:param transfer_type: 转移类型
:param force_nfo: 强制刮削nfo
:param force_img: 强制刮削图片
:return: 成功或失败
"""
if settings.SCRAP_SOURCE != "themoviedb":
@ -229,13 +232,17 @@ class TheMovieDbModule(_ModuleBase):
scrape_path = path / path.name
self.scraper.gen_scraper_files(mediainfo=mediainfo,
file_path=scrape_path,
transfer_type=transfer_type)
transfer_type=transfer_type,
force_nfo=force_nfo,
force_img=force_img)
elif path.is_file():
# 单个文件
logger.info(f"开始刮削媒体库文件:{path} ...")
self.scraper.gen_scraper_files(mediainfo=mediainfo,
file_path=path,
transfer_type=transfer_type)
transfer_type=transfer_type,
force_nfo=force_nfo,
force_img=force_img)
else:
# 目录下的所有文件
logger.info(f"开始刮削目录:{path} ...")
@ -244,7 +251,9 @@ class TheMovieDbModule(_ModuleBase):
continue
self.scraper.gen_scraper_files(mediainfo=mediainfo,
file_path=file,
transfer_type=transfer_type)
transfer_type=transfer_type,
force_nfo=force_nfo,
force_img=force_img)
logger.info(f"{path} 刮削完成")
def tmdb_discover(self, mtype: MediaType, sort_by: str, with_genres: str, with_original_language: str,

View File

@ -19,19 +19,26 @@ from app.utils.system import SystemUtils
class TmdbScraper:
tmdb = None
_transfer_type = settings.TRANSFER_TYPE
_force_nfo = False
_force_img = False
def __init__(self, tmdb):
self.tmdb = tmdb
def gen_scraper_files(self, mediainfo: MediaInfo, file_path: Path, transfer_type: str):
def gen_scraper_files(self, mediainfo: MediaInfo, file_path: Path, transfer_type: str,
force_nfo: bool = False, force_img: bool = False):
"""
生成刮削文件包括NFO和图片传入路径为文件路径
:param mediainfo: 媒体信息
:param file_path: 文件路径或者目录路径
:param transfer_type: 传输类型
:param force_nfo: 是否强制生成NFO
:param force_img: 是否强制生成图片
"""
self._transfer_type = transfer_type
self._force_nfo = force_nfo
self._force_img = force_img
def __get_episode_detail(_seasoninfo: dict, _episode: int):
"""
@ -46,8 +53,8 @@ class TmdbScraper:
# 电影,路径为文件名 名称/名称.xxx 或者蓝光原盘目录 名称/名称
if mediainfo.type == MediaType.MOVIE:
# 不存在时才处理
if not file_path.with_name("movie.nfo").exists() \
and not file_path.with_suffix(".nfo").exists():
if self._force_nfo or (not file_path.with_name("movie.nfo").exists()
and not file_path.with_suffix(".nfo").exists()):
# 生成电影描述文件
self.__gen_movie_nfo_file(mediainfo=mediainfo,
file_path=file_path)
@ -59,14 +66,16 @@ class TmdbScraper:
and isinstance(attr_value, str) \
and attr_value.startswith("http"):
image_name = attr_name.replace("_path", "") + Path(attr_value).suffix
self.__save_image(url=attr_value,
file_path=file_path.with_name(image_name))
image_path = file_path.with_name(image_name)
if self._force_img or not image_path.exists():
self.__save_image(url=attr_value,
file_path=image_path)
# 电视剧,路径为每一季的文件名 名称/Season xx/名称 SxxExx.xxx
else:
# 识别
meta = MetaInfo(file_path.stem)
# 根目录不存在时才处理
if not file_path.parent.with_name("tvshow.nfo").exists():
if self._force_nfo or not file_path.parent.with_name("tvshow.nfo").exists():
# 根目录描述文件
self.__gen_tv_nfo_file(mediainfo=mediainfo,
dir_path=file_path.parents[1])
@ -79,13 +88,15 @@ class TmdbScraper:
and isinstance(attr_value, str) \
and attr_value.startswith("http"):
image_name = attr_name.replace("_path", "") + Path(attr_value).suffix
self.__save_image(url=attr_value,
file_path=file_path.parent.with_name(image_name))
image_path = file_path.parent.with_name(image_name)
if self._force_img or not image_path.exists():
self.__save_image(url=attr_value,
file_path=image_path)
# 查询季信息
seasoninfo = self.tmdb.get_tv_season_detail(mediainfo.tmdb_id, meta.begin_season)
if seasoninfo:
# 季目录NFO
if not file_path.with_name("season.nfo").exists():
if self._force_nfo or not file_path.with_name("season.nfo").exists():
self.__gen_tv_season_nfo_file(seasoninfo=seasoninfo,
season=meta.begin_season,
season_path=file_path.parent)
@ -96,7 +107,9 @@ class TmdbScraper:
ext = Path(seasoninfo.get('poster_path')).suffix
# URL
url = f"https://{settings.TMDB_IMAGE_DOMAIN}/t/p/original{seasoninfo.get('poster_path')}"
self.__save_image(url, file_path.parent.with_name(f"season{sea_seq}-poster{ext}"))
image_path = file_path.parent.with_name(f"season{sea_seq}-poster{ext}")
if self._force_img or not image_path.exists():
self.__save_image(url=url, file_path=image_path)
# 季的其它图片
for attr_name, attr_value in vars(mediainfo).items():
if attr_value \
@ -106,13 +119,15 @@ class TmdbScraper:
and isinstance(attr_value, str) \
and attr_value.startswith("http"):
image_name = attr_name.replace("_path", "") + Path(attr_value).suffix
self.__save_image(url=attr_value,
file_path=file_path.parent.with_name(image_name))
image_path = file_path.parent.with_name(image_name)
if self._force_img or not image_path.exists():
self.__save_image(url=attr_value,
file_path=image_path)
# 查询集详情
episodeinfo = __get_episode_detail(seasoninfo, meta.begin_episode)
if episodeinfo:
# 集NFO
if not file_path.with_suffix(".nfo").exists():
if self._force_nfo or not file_path.with_suffix(".nfo").exists():
self.__gen_tv_episode_nfo_file(episodeinfo=episodeinfo,
tmdbid=mediainfo.tmdb_id,
season=meta.begin_season,
@ -121,7 +136,7 @@ class TmdbScraper:
# 集的图片
episode_image = episodeinfo.get("still_path")
image_path = file_path.with_name(file_path.stem + "-thumb").with_suffix(Path(episode_image).suffix)
if episode_image:
if episode_image and (self._force_img or not image_path.exists()):
self.__save_image(
f"https://{settings.TMDB_IMAGE_DOMAIN}/t/p/original{episode_image}",
image_path)
@ -340,8 +355,6 @@ class TmdbScraper:
"""
下载图片并保存
"""
if file_path.exists():
return
try:
logger.info(f"正在下载{file_path.stem}图片:{url} ...")
r = RequestUtils().get_res(url=url, raise_exception=True)
@ -362,8 +375,6 @@ class TmdbScraper:
"""
保存NFO
"""
if file_path.exists():
return
xml_str = doc.toprettyxml(indent=" ", encoding="utf-8")
if self._transfer_type in ['rclone_move', 'rclone_copy']:
self.__save_remove_file(file_path, xml_str)