# -*- coding: utf-8 -*- import re from abc import ABCMeta, abstractmethod from typing import Tuple import chardet from ruamel.yaml import CommentedMap from app.helper.browser import PlaywrightHelper from app.log import logger from app.utils.http import RequestUtils from app.utils.string import StringUtils class _ISiteSigninHandler(metaclass=ABCMeta): """ 实现站点签到的基类,所有站点签到类都需要继承此类,并实现match和signin方法 实现类放置到sitesignin目录下将会自动加载 """ # 匹配的站点Url,每一个实现类都需要设置为自己的站点Url site_url = "" @abstractmethod def match(self, url: str) -> bool: """ 根据站点Url判断是否匹配当前站点签到类,大部分情况使用默认实现即可 :param url: 站点Url :return: 是否匹配,如匹配则会调用该类的signin方法 """ return True if StringUtils.url_equal(url, self.site_url) else False @abstractmethod def signin(self, site_info: CommentedMap) -> Tuple[bool, str]: """ 执行签到操作 :param site_info: 站点信息,含有站点Url、站点Cookie、UA等信息 :return: True|False,签到结果信息 """ pass @staticmethod def get_page_source(url: str, cookie: str, ua: str, proxies: dict, render: bool) -> str: """ 获取页面源码 :param url: Url地址 :param cookie: Cookie :param ua: UA :param proxies: 代理 :param render: 是否渲染 :return: 页面源码,错误信息 """ if render: return PlaywrightHelper().get_page_source(url=url, cookies=cookie, ua=ua, proxies=proxies) else: res = RequestUtils(cookies=cookie, ua=ua, proxies=proxies ).get_res(url=url) if res is not None: # 使用chardet检测字符编码 raw_data = res.content if raw_data: try: result = chardet.detect(raw_data) encoding = result['encoding'] # 解码为字符串 return raw_data.decode(encoding) except Exception as e: logger.error(f"chardet解码失败:{e}") return res.text else: return res.text return "" @staticmethod def sign_in_result(html_res: str, regexs: list) -> bool: """ 判断是否签到成功 """ html_text = re.sub(r"#\d+", "", re.sub(r"\d+px", "", html_res)) for regex in regexs: if re.search(str(regex), html_text): return True return False