feat: B站评论API
This commit is contained in:
parent
a790d72db9
commit
8f04943105
@ -4,7 +4,7 @@
|
|||||||
# @Desc : bilibili 请求客户端
|
# @Desc : bilibili 请求客户端
|
||||||
import asyncio
|
import asyncio
|
||||||
import json
|
import json
|
||||||
from typing import Any, Callable, Dict, Optional
|
from typing import Any, Callable, Dict, Optional, List
|
||||||
from urllib.parse import urlencode
|
from urllib.parse import urlencode
|
||||||
|
|
||||||
import httpx
|
import httpx
|
||||||
@ -14,7 +14,7 @@ from tools import utils
|
|||||||
|
|
||||||
from .help import BilibiliSign
|
from .help import BilibiliSign
|
||||||
from .exception import DataFetchError
|
from .exception import DataFetchError
|
||||||
from .field import OrderType
|
from .field import SearchOrderType, CommentOrderType
|
||||||
|
|
||||||
|
|
||||||
class BilibiliClient:
|
class BilibiliClient:
|
||||||
@ -63,7 +63,8 @@ class BilibiliClient:
|
|||||||
:return:
|
:return:
|
||||||
"""
|
"""
|
||||||
local_storage = await self.playwright_page.evaluate("() => window.localStorage")
|
local_storage = await self.playwright_page.evaluate("() => window.localStorage")
|
||||||
wbi_img_urls = local_storage.get("wbi_img_urls", "") or local_storage.get("wbi_img_url") + "-" + local_storage.get("wbi_sub_url")
|
wbi_img_urls = local_storage.get("wbi_img_urls", "") or local_storage.get(
|
||||||
|
"wbi_img_url") + "-" + local_storage.get("wbi_sub_url")
|
||||||
if wbi_img_urls and "-" in wbi_img_urls:
|
if wbi_img_urls and "-" in wbi_img_urls:
|
||||||
img_url, sub_url = wbi_img_urls.split("-")
|
img_url, sub_url = wbi_img_urls.split("-")
|
||||||
else:
|
else:
|
||||||
@ -105,7 +106,7 @@ class BilibiliClient:
|
|||||||
self.cookie_dict = cookie_dict
|
self.cookie_dict = cookie_dict
|
||||||
|
|
||||||
async def search_video_by_keyword(self, keyword: str, page: int = 1, page_size: int = 20,
|
async def search_video_by_keyword(self, keyword: str, page: int = 1, page_size: int = 20,
|
||||||
order: OrderType = OrderType.DEFAULT):
|
order: SearchOrderType = SearchOrderType.DEFAULT):
|
||||||
"""
|
"""
|
||||||
KuaiShou web search api
|
KuaiShou web search api
|
||||||
:param keyword: 搜索关键词
|
:param keyword: 搜索关键词
|
||||||
@ -134,21 +135,31 @@ class BilibiliClient:
|
|||||||
}
|
}
|
||||||
return await self.post("", post_data)
|
return await self.post("", post_data)
|
||||||
|
|
||||||
async def get_video_comments(self, photo_id: str, pcursor: str = "") -> Dict:
|
async def get_video_comments(self,
|
||||||
|
video_id: str,
|
||||||
|
order_mode: CommentOrderType = CommentOrderType.DEFAULT,
|
||||||
|
pagination_str: str = '{"offset":""}'
|
||||||
|
) -> Dict:
|
||||||
"""get video comments
|
"""get video comments
|
||||||
:param photo_id: photo id you want to fetch
|
:param video_id: 视频 ID
|
||||||
:param pcursor: last you get pcursor, defaults to ""
|
:param order_mode: 排序方式
|
||||||
|
:param pagination_str: 分页字符串,由 api 返回下一个评论请求的分页信息
|
||||||
:return:
|
:return:
|
||||||
"""
|
"""
|
||||||
|
uri = "/x/v2/reply/wbi/main"
|
||||||
post_data = {
|
post_data = {
|
||||||
|
"oid": video_id,
|
||||||
|
"mode": order_mode.value,
|
||||||
|
"type": 1,
|
||||||
|
"pagination_str": pagination_str
|
||||||
}
|
}
|
||||||
return await self.post("", post_data)
|
return await self.post(uri, post_data)
|
||||||
|
|
||||||
async def get_video_all_comments(self, photo_id: str, crawl_interval: float = 1.0, is_fetch_sub_comments=False,
|
async def get_video_all_comments(self, video_id: str, crawl_interval: float = 1.0, is_fetch_sub_comments=False,
|
||||||
callback: Optional[Callable] = None, ):
|
callback: Optional[Callable] = None, ):
|
||||||
"""
|
"""
|
||||||
get video all comments include sub comments
|
get video all comments include sub comments
|
||||||
:param photo_id:
|
:param video_id:
|
||||||
:param crawl_interval:
|
:param crawl_interval:
|
||||||
:param is_fetch_sub_comments:
|
:param is_fetch_sub_comments:
|
||||||
:param callback:
|
:param callback:
|
||||||
@ -156,19 +167,19 @@ class BilibiliClient:
|
|||||||
"""
|
"""
|
||||||
|
|
||||||
result = []
|
result = []
|
||||||
pcursor = ""
|
is_end = False
|
||||||
while pcursor != "no_more":
|
pagination_str = '{"offset":""}'
|
||||||
comments_res = await self.get_video_comments(photo_id, pcursor)
|
while not is_end:
|
||||||
vision_commen_list = comments_res.get("visionCommentList", {})
|
comments_res = await self.get_video_comments(video_id, CommentOrderType.DEFAULT, pagination_str)
|
||||||
pcursor = vision_commen_list.get("pcursor", "")
|
curson_info: Dict = comments_res.get("data").get("cursor")
|
||||||
comments = vision_commen_list.get("rootComments", [])
|
comment_list: List[Dict] = comments_res.get("replies", [])
|
||||||
|
is_end = curson_info.get("is_end")
|
||||||
|
pagination_str = curson_info.get("pagination_reply").get("next_offset")
|
||||||
if callback: # 如果有回调函数,就执行回调函数
|
if callback: # 如果有回调函数,就执行回调函数
|
||||||
await callback(photo_id, comments)
|
await callback(video_id, comment_list)
|
||||||
|
|
||||||
await asyncio.sleep(crawl_interval)
|
await asyncio.sleep(crawl_interval)
|
||||||
if not is_fetch_sub_comments:
|
if not is_fetch_sub_comments:
|
||||||
result.extend(comments)
|
result.extend(comment_list)
|
||||||
continue
|
continue
|
||||||
# todo handle get sub comments
|
# todo handle get sub comments
|
||||||
return result
|
return result
|
||||||
|
@ -6,7 +6,7 @@
|
|||||||
from enum import Enum
|
from enum import Enum
|
||||||
|
|
||||||
|
|
||||||
class OrderType(Enum):
|
class SearchOrderType(Enum):
|
||||||
# 综合排序
|
# 综合排序
|
||||||
DEFAULT = ""
|
DEFAULT = ""
|
||||||
|
|
||||||
@ -21,3 +21,14 @@ class OrderType(Enum):
|
|||||||
|
|
||||||
# 最多收藏
|
# 最多收藏
|
||||||
MOST_MARK = "stow"
|
MOST_MARK = "stow"
|
||||||
|
|
||||||
|
|
||||||
|
class CommentOrderType(Enum):
|
||||||
|
# 仅按热度
|
||||||
|
DEFAULT = 0
|
||||||
|
|
||||||
|
# 按热度+按时间
|
||||||
|
MIXED = 1
|
||||||
|
|
||||||
|
# 按时间
|
||||||
|
TIME = 2
|
||||||
|
Loading…
Reference in New Issue
Block a user