From 0364b23b5b8c7ab330cab00a4cc9a8a30f234037 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E7=BF=9F=E6=8C=81=E6=B1=9F?= <129171955+2513502304@users.noreply.github.com> Date: Sun, 19 Jan 2025 19:55:18 +0800 Subject: [PATCH] =?UTF-8?q?Update=20core.py=EF=BC=8C=E4=B8=BA=E7=88=AC?= =?UTF-8?q?=E5=8F=96=E7=B1=BB=E5=9E=8B=E4=B8=BA`detail`=E5=92=8C`creator`?= =?UTF-8?q?=E7=9A=84=E4=BB=BB=E5=8A=A1=EF=BC=8C=E6=B7=BB=E5=8A=A0=E4=BA=86?= =?UTF-8?q?=E5=92=8C`search`=E4=BB=BB=E5=8A=A1=E4=B8=80=E6=A0=B7=E7=9A=84?= =?UTF-8?q?=EF=BC=8C=E7=94=A8=E4=BA=8E=E8=BD=AC=E5=AD=98up=E4=B8=BB?= =?UTF-8?q?=E4=BF=A1=E6=81=AF=E7=9A=84`bilibili=5Fstore.update=5Fup=5Finfo?= =?UTF-8?q?`=E7=9A=84=E5=87=BD=E6=95=B0=E8=B0=83=E7=94=A8?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 正如`search`函数中一样,在调用`get_video_info_task`后,`bilibili_video`和`bilibili_up_info`信息都将获得。 原先的`get_specified_videos`在`detail`任务中仅保存了指定`bilibili_video`的信息,而`bilibili_up_info`信息尚未保存,`creator`任务的`get_creator_videos`中也调用了`get_specified_videos`获取指定创作者下所有的视频信息,同理也未保存`bilibili_up_info`信息。 所以只需为`get_specified_videos`添加一句`await bilibili_store.update_up_info(video_detail)`即可和`search`任务下获得的数据文件个数保持一致,不会缺少对应up主的个人信息。 已测试: - 原先仅`search`任务下产生`*_creator.csv`、`*_contents.csv`、`*_comments.csv`,而`detail`和`creator`任务下缺少`*_creator.csv`文件。 - 此次提交后将使三种模式下的数据文件个数一致。 --- media_platform/bilibili/core.py | 1 + 1 file changed, 1 insertion(+) diff --git a/media_platform/bilibili/core.py b/media_platform/bilibili/core.py index 4c2305b..62ba82d 100644 --- a/media_platform/bilibili/core.py +++ b/media_platform/bilibili/core.py @@ -297,6 +297,7 @@ class BilibiliCrawler(AbstractCrawler): if video_aid: video_aids_list.append(video_aid) await bilibili_store.update_bilibili_video(video_detail) + await bilibili_store.update_up_info(video_detail) await self.get_bilibili_video(video_detail, semaphore) await self.batch_get_video_comments(video_aids_list)