JoeanAmier d1bca5a896 perf: 优化重定向链接获取逻辑
1. 更新 chunk 参数默认值
2. 更新配置文件参数说明

Closes #138
Closes #139
2024-08-04 15:35:23 +08:00

63 lines
1.9 KiB
Python

from httpx import HTTPError
from source.module import ERROR
from source.module import Manager
from source.module import logging
from source.module import retry
__all__ = ["Html"]
class Html:
def __init__(self, manager: Manager, ):
self.retry = manager.retry
self.message = manager.message
self.client = manager.request_client
self.headers = manager.headers
self.blank_headers = manager.blank_headers
@retry
async def request_url(
self,
url: str,
content=True,
log=None,
**kwargs,
) -> str:
headers = self.select_headers(url, )
try:
match content:
case True:
response = await self.__request_url_get(url, headers, **kwargs, )
response.raise_for_status()
return response.text
case False:
response = await self.__request_url_head(url, headers, **kwargs, )
return str(response.url)
except HTTPError as error:
logging(log, str(error), ERROR)
logging(
log, self.message("网络异常,请求 {0} 失败").format(url), ERROR)
return ""
@staticmethod
def format_url(url: str) -> str:
return bytes(url, "utf-8").decode("unicode_escape")
def select_headers(self, url: str) -> dict:
return self.headers if "explore" in url else self.blank_headers
async def __request_url_head(self, url: str, headers: dict, **kwargs, ):
return await self.client.head(
url,
headers=headers,
**kwargs,
)
async def __request_url_get(self, url: str, headers: dict, **kwargs, ):
return await self.client.get(
url,
headers=headers,
**kwargs,
)