fix hhanclub数据统计

This commit is contained in:
jxxghp
2023-08-30 14:51:55 +08:00
parent f8221bb526
commit 16289d86b6
3 changed files with 71 additions and 18 deletions

View File

@ -26,6 +26,7 @@ class SiteSchema(Enum):
NexusPhp = "NexusPhp"
NexusProject = "NexusProject"
NexusRabbit = "NexusRabbit"
NexusHhanclub = "NexusHhanclub"
SmallHorse = "Small Horse"
Unit3d = "Unit3d"
TorrentLeech = "TorrentLeech"

View File

@ -0,0 +1,60 @@
# -*- coding: utf-8 -*-
import re
from lxml import etree
from app.plugins.sitestatistic.siteuserinfo import SITE_BASE_ORDER, SiteSchema
from app.plugins.sitestatistic.siteuserinfo.nexus_php import NexusPhpSiteUserInfo
from app.utils.string import StringUtils
class NexusHhanclubSiteUserInfo(NexusPhpSiteUserInfo):
schema = SiteSchema.NexusHhanclub
order = SITE_BASE_ORDER + 20
@classmethod
def match(cls, html_text: str) -> bool:
return 'hhanclub.top' in html_text
def _parse_user_traffic_info(self, html_text):
super()._parse_user_traffic_info(html_text)
html_text = self._prepare_html_text(html_text)
html = etree.HTML(html_text)
# 上传、下载、分享率
upload_match = re.search(r"[_<>/a-zA-Z-=\"'\s#;]+([\d,.\s]+[KMGTPI]*B)",
html.xpath('//*[@id="user-info-panel"]/div[2]/div[2]/div[4]/text()')[0])
download_match = re.search(r"[_<>/a-zA-Z-=\"'\s#;]+([\d,.\s]+[KMGTPI]*B)",
html.xpath('//*[@id="user-info-panel"]/div[2]/div[2]/div[5]/text()')[0])
ratio_match = re.search(r"分享率][:_<>/a-zA-Z-=\"'\s#;]+([\d,.\s]+)",
html.xpath('//*[@id="user-info-panel"]/div[2]/div[1]/div[1]/div/text()')[0])
# 计算分享率
self.upload = StringUtils.num_filesize(upload_match.group(1).strip()) if upload_match else 0
self.download = StringUtils.num_filesize(download_match.group(1).strip()) if download_match else 0
# 优先使用页面上的分享率
calc_ratio = 0.0 if self.download <= 0.0 else round(self.upload / self.download, 3)
self.ratio = StringUtils.str_float(ratio_match.group(1)) if (
ratio_match and ratio_match.group(1).strip()) else calc_ratio
def _parse_user_detail_info(self, html_text: str):
"""
解析用户额外信息,加入时间,等级
:param html_text:
:return:
"""
super()._parse_user_detail_info(html_text)
html = etree.HTML(html_text)
if not html:
return
# 加入时间
join_at_text = html.xpath('//*[@id="mainContent"]/div/div[2]/div[4]/div[3]/span[2]/text()[1]')
if join_at_text:
self.join_at = StringUtils.unify_datetime_str(join_at_text[0].split(' (')[0].strip())
def _get_user_level(self, html):
super()._get_user_level(html)
self.user_level = html.xpath('//*[@id="mainContent"]/div/div[2]/div[2]/div[4]/img/@title')[0]

View File

@ -62,7 +62,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
def _parse_user_base_info(self, html_text: str):
# 合并解析,减少额外请求调用
self.__parse_user_traffic_info(html_text)
self._parse_user_traffic_info(html_text)
self._user_traffic_page = None
self._parse_message_unread(html_text)
@ -84,7 +84,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
self.username = str(ret[0])
return
def __parse_user_traffic_info(self, html_text):
def _parse_user_traffic_info(self, html_text):
html_text = self._prepare_html_text(html_text)
upload_match = re.search(r"[^总]上[传傳]量?[:_<>/a-zA-Z-=\"'\s#;]+([\d,.\s]+[KMGTPI]*B)", html_text,
re.IGNORECASE)
@ -102,7 +102,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
self.leeching = StringUtils.str_int(leeching_match.group(2)) if leeching_match and leeching_match.group(
2).strip() else 0
html = etree.HTML(html_text)
has_ucoin, self.bonus = self.__parse_ucoin(html)
has_ucoin, self.bonus = self._parse_ucoin(html)
if has_ucoin:
return
tmps = html.xpath('//a[contains(@href,"mybonus")]/text()') if html else None
@ -126,7 +126,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
logger.error(f"{self.site_name} 解析魔力值出错, 错误信息: {err}")
@staticmethod
def __parse_ucoin(html):
def _parse_ucoin(html):
"""
解析ucoin, 统一转换为铜币
:param html:
@ -151,14 +151,6 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
return True, gold * 100 * 100 + silver * 100 + copper
return False, 0.0
def _parse_user_traffic_info(self, html_text: str):
"""
上传/下载/分享率 [做种数/魔力值]
:param html_text:
:return:
"""
pass
def _parse_user_torrent_seeding_info(self, html_text: str, multi_page: bool = False) -> Optional[str]:
"""
做种相关信息
@ -238,9 +230,9 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
if not html:
return
self.__get_user_level(html)
self._get_user_level(html)
self.__fixup_traffic_info(html)
self._fixup_traffic_info(html)
# 加入日期
join_at_text = html.xpath(
@ -285,9 +277,9 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
if not self.seeding:
self.seeding = tmp_seeding
self.__fixup_torrent_seeding_page(html)
self._fixup_torrent_seeding_page(html)
def __fixup_torrent_seeding_page(self, html):
def _fixup_torrent_seeding_page(self, html):
"""
修正种子页面链接
:param html:
@ -320,7 +312,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
# if seeding_url_text:
# self._torrent_seeding_page = seeding_url_text
def __get_user_level(self, html):
def _get_user_level(self, html):
# 等级 获取同一行等级数据图片格式等级取title信息否则取文本信息
user_levels_text = html.xpath('//tr/td[text()="等級" or text()="等级" or *[text()="等级"]]/'
'following-sibling::td[1]/img[1]/@title')
@ -392,7 +384,7 @@ class NexusPhpSiteUserInfo(ISiteUserInfo):
return message_head_text, message_date_text, message_content_text
def __fixup_traffic_info(self, html):
def _fixup_traffic_info(self, html):
# fixup bonus
if not self.bonus:
bonus_text = html.xpath('//tr/td[text()="魔力值" or text()="猫粮"]/following-sibling::td[1]/text()')