mirror of
https://github.com/RYDE-WORK/MediaCrawler.git
synced 2026-02-06 08:53:21 +08:00
feat: 快手文件目录建立
This commit is contained in:
parent
3790e8041e
commit
95ca606938
1
media_platform/kuaishou/__init__.py
Normal file
1
media_platform/kuaishou/__init__.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
71
media_platform/kuaishou/client.py
Normal file
71
media_platform/kuaishou/client.py
Normal file
@ -0,0 +1,71 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
|
from typing import Dict
|
||||||
|
import asyncio
|
||||||
|
import json
|
||||||
|
from typing import Dict, Optional
|
||||||
|
|
||||||
|
import httpx
|
||||||
|
from playwright.async_api import BrowserContext, Page
|
||||||
|
|
||||||
|
from tools import utils
|
||||||
|
|
||||||
|
from .exception import DataFetchError, IPBlockError
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
class KuaishouClient:
|
||||||
|
def __init__(
|
||||||
|
self,
|
||||||
|
timeout=10,
|
||||||
|
proxies=None,
|
||||||
|
*,
|
||||||
|
headers: Dict[str, str],
|
||||||
|
playwright_page: Page,
|
||||||
|
cookie_dict: Dict[str, str],
|
||||||
|
):
|
||||||
|
self.proxies = proxies
|
||||||
|
self.timeout = timeout
|
||||||
|
self.headers = headers
|
||||||
|
self._host = "https://edith.xiaohongshu.com"
|
||||||
|
self.playwright_page = playwright_page
|
||||||
|
self.cookie_dict = cookie_dict
|
||||||
|
|
||||||
|
async def _pre_headers(self, url: str, data=None):
|
||||||
|
pass
|
||||||
|
|
||||||
|
async def request(self, method, url, **kwargs) -> Dict:
|
||||||
|
async with httpx.AsyncClient(proxies=self.proxies) as client:
|
||||||
|
response = await client.request(
|
||||||
|
method, url, timeout=self.timeout,
|
||||||
|
**kwargs
|
||||||
|
)
|
||||||
|
data: Dict = response.json()
|
||||||
|
if data["success"]:
|
||||||
|
return data.get("data", data.get("success", {}))
|
||||||
|
else:
|
||||||
|
raise DataFetchError(data.get("msg", None))
|
||||||
|
|
||||||
|
async def get(self, uri: str, params=None) -> Dict:
|
||||||
|
final_uri = uri
|
||||||
|
if isinstance(params, dict):
|
||||||
|
final_uri = (f"{uri}?"
|
||||||
|
f"{'&'.join([f'{k}={v}' for k, v in params.items()])}")
|
||||||
|
headers = await self._pre_headers(final_uri)
|
||||||
|
return await self.request(method="GET", url=f"{self._host}{final_uri}", headers=headers)
|
||||||
|
|
||||||
|
async def post(self, uri: str, data: dict) -> Dict:
|
||||||
|
headers = await self._pre_headers(uri, data)
|
||||||
|
json_str = json.dumps(data, separators=(',', ':'), ensure_ascii=False)
|
||||||
|
return await self.request(method="POST", url=f"{self._host}{uri}",
|
||||||
|
data=json_str, headers=headers)
|
||||||
|
|
||||||
|
async def ping(self) -> bool:
|
||||||
|
"""get a note to check if login state is ok"""
|
||||||
|
utils.logger.info("Begin to ping xhs...")
|
||||||
|
ping_flag = False
|
||||||
|
try:
|
||||||
|
pass
|
||||||
|
except Exception as e:
|
||||||
|
utils.logger.error(f"Ping xhs failed: {e}, and try to login again...")
|
||||||
|
ping_flag = False
|
||||||
|
return ping_flag
|
||||||
1
media_platform/kuaishou/core.py
Normal file
1
media_platform/kuaishou/core.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
9
media_platform/kuaishou/exception.py
Normal file
9
media_platform/kuaishou/exception.py
Normal file
@ -0,0 +1,9 @@
|
|||||||
|
from httpx import RequestError
|
||||||
|
|
||||||
|
|
||||||
|
class DataFetchError(RequestError):
|
||||||
|
"""something error when fetch"""
|
||||||
|
|
||||||
|
|
||||||
|
class IPBlockError(RequestError):
|
||||||
|
"""fetch so fast that the server block us ip"""
|
||||||
1
media_platform/kuaishou/field.py
Normal file
1
media_platform/kuaishou/field.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
20
media_platform/kuaishou/login.py
Normal file
20
media_platform/kuaishou/login.py
Normal file
@ -0,0 +1,20 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
|
|
||||||
|
from base.base_crawler import AbstractLogin
|
||||||
|
|
||||||
|
|
||||||
|
class KuaishouLogin(AbstractLogin):
|
||||||
|
def __init__(self):
|
||||||
|
pass
|
||||||
|
|
||||||
|
async def begin(self):
|
||||||
|
pass
|
||||||
|
|
||||||
|
async def login_by_qrcode(self):
|
||||||
|
pass
|
||||||
|
|
||||||
|
async def login_by_mobile(self):
|
||||||
|
pass
|
||||||
|
|
||||||
|
async def login_by_cookies(self):
|
||||||
|
pass
|
||||||
Loading…
x
Reference in New Issue
Block a user