144 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			144 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| from datetime import datetime
 | ||
| from typing import List, Optional, Tuple, Union
 | ||
| 
 | ||
| from ruamel.yaml import CommentedMap
 | ||
| 
 | ||
| from app.core.context import MediaInfo, TorrentInfo
 | ||
| from app.log import logger
 | ||
| from app.modules import _ModuleBase
 | ||
| from app.modules.indexer.mtorrent import MTorrentSpider
 | ||
| from app.modules.indexer.spider import TorrentSpider
 | ||
| from app.modules.indexer.tnode import TNodeSpider
 | ||
| from app.modules.indexer.torrentleech import TorrentLeech
 | ||
| from app.schemas.types import MediaType
 | ||
| from app.utils.string import StringUtils
 | ||
| 
 | ||
| 
 | ||
| class IndexerModule(_ModuleBase):
 | ||
|     """
 | ||
|     索引模块
 | ||
|     """
 | ||
| 
 | ||
|     def init_module(self) -> None:
 | ||
|         pass
 | ||
| 
 | ||
|     def stop(self):
 | ||
|         pass
 | ||
| 
 | ||
|     def init_setting(self) -> Tuple[str, Union[str, bool]]:
 | ||
|         return "INDEXER", "builtin"
 | ||
| 
 | ||
|     def search_torrents(self, site: CommentedMap, mediainfo: MediaInfo = None,
 | ||
|                         keyword: str = None, page: int = 0, area: str = "title") -> List[TorrentInfo]:
 | ||
|         """
 | ||
|         搜索一个站点
 | ||
|         :param mediainfo:  识别的媒体信息
 | ||
|         :param site:  站点
 | ||
|         :param keyword:  搜索关键词,如有按关键词搜索,否则按媒体信息名称搜索
 | ||
|         :param page:  页码
 | ||
|         :param area:  搜索区域 title or imdbid
 | ||
|         :return: 资源列表
 | ||
|         """
 | ||
|         # 确认搜索的名字
 | ||
|         if keyword:
 | ||
|             search_word = keyword
 | ||
|         elif mediainfo:
 | ||
|             search_word = mediainfo.title
 | ||
|         else:
 | ||
|             search_word = None
 | ||
| 
 | ||
|         if search_word \
 | ||
|                 and site.get('language') == "en" \
 | ||
|                 and StringUtils.is_chinese(search_word):
 | ||
|             # 不支持中文
 | ||
|             logger.warn(f"{site.get('name')} 不支持中文搜索")
 | ||
|             return []
 | ||
| 
 | ||
|         # 去除搜索关键字中的特殊字符
 | ||
|         if search_word:
 | ||
|             search_word = StringUtils.clear(search_word, replace_word=" ", allow_space=True)
 | ||
| 
 | ||
|         # 开始索引
 | ||
|         result_array = []
 | ||
|         # 开始计时
 | ||
|         start_time = datetime.now()
 | ||
|         try:
 | ||
|             imdbid = mediainfo.imdb_id if mediainfo and area == "imdbid" else None
 | ||
|             if site.get('parser') == "TNodeSpider":
 | ||
|                 error_flag, result_array = TNodeSpider(site).search(
 | ||
|                     keyword=search_word,
 | ||
|                     imdbid=imdbid,
 | ||
|                     page=page
 | ||
|                 )
 | ||
|             elif site.get('parser') == "TorrentLeech":
 | ||
|                 error_flag, result_array = TorrentLeech(site).search(
 | ||
|                     keyword=search_word,
 | ||
|                     page=page
 | ||
|                 )
 | ||
|             elif site.get('parser') == "mTorrent":
 | ||
|                 error_flag, result_array = MTorrentSpider(site).search(
 | ||
|                     keyword=search_word,
 | ||
|                     mtype=mediainfo.type if mediainfo else None,
 | ||
|                     page=page
 | ||
|                 )
 | ||
|             else:
 | ||
|                 error_flag, result_array = self.__spider_search(
 | ||
|                     keyword=search_word,
 | ||
|                     imdbid=imdbid,
 | ||
|                     indexer=site,
 | ||
|                     mtype=mediainfo.type if mediainfo else None,
 | ||
|                     page=page
 | ||
|                 )
 | ||
|         except Exception as err:
 | ||
|             logger.error(f"{site.get('name')} 搜索出错:{err}")
 | ||
| 
 | ||
|         # 索引花费的时间
 | ||
|         seconds = round((datetime.now() - start_time).seconds, 1)
 | ||
| 
 | ||
|         # 返回结果
 | ||
|         if not result_array or len(result_array) == 0:
 | ||
|             logger.warn(f"{site.get('name')} 未搜索到数据,耗时 {seconds} 秒")
 | ||
|             return []
 | ||
|         else:
 | ||
|             logger.info(f"{site.get('name')} 搜索完成,耗时 {seconds} 秒,返回数据:{len(result_array)}")
 | ||
|             # 合并站点信息,以TorrentInfo返回
 | ||
|             return [TorrentInfo(site=site.get("id"),
 | ||
|                                 site_name=site.get("name"),
 | ||
|                                 site_cookie=site.get("cookie"),
 | ||
|                                 site_ua=site.get("ua"),
 | ||
|                                 site_proxy=site.get("proxy"),
 | ||
|                                 site_order=site.get("pri"),
 | ||
|                                 **result) for result in result_array]
 | ||
| 
 | ||
|     @staticmethod
 | ||
|     def __spider_search(indexer: CommentedMap,
 | ||
|                         keyword: str = None,
 | ||
|                         imdbid: str = None,
 | ||
|                         mtype: MediaType = None,
 | ||
|                         page: int = 0) -> (bool, List[dict]):
 | ||
|         """
 | ||
|         根据关键字搜索单个站点
 | ||
|         :param: indexer: 站点配置
 | ||
|         :param: keyword: 关键字
 | ||
|         :param: imdbid: imdbid
 | ||
|         :param: page: 页码
 | ||
|         :param: mtype: 媒体类型
 | ||
|         :param: timeout: 超时时间
 | ||
|         :return: 是否发生错误, 种子列表
 | ||
|         """
 | ||
|         _spider = TorrentSpider(indexer=indexer,
 | ||
|                                 mtype=mtype,
 | ||
|                                 keyword=keyword,
 | ||
|                                 imdbid=imdbid,
 | ||
|                                 page=page)
 | ||
| 
 | ||
|         return _spider.is_error, _spider.get_torrents()
 | ||
| 
 | ||
|     def refresh_torrents(self, site: CommentedMap) -> Optional[List[TorrentInfo]]:
 | ||
|         """
 | ||
|         获取站点最新一页的种子,多个站点需要多线程处理
 | ||
|         :param site:  站点
 | ||
|         :reutrn: 种子资源列表
 | ||
|         """
 | ||
|         return self.search_torrents(site=site)
 |