mirror of
https://github.com/RYDE-WORK/MediaCrawler.git
synced 2026-02-07 17:37:34 +08:00
fix: weibo creator duplicate bug
This commit is contained in:
parent
f9e7d56d4f
commit
c12a63acb2
@ -353,10 +353,7 @@ class WeiboClient:
|
|||||||
utils.logger.error(
|
utils.logger.error(
|
||||||
f"[WeiboClient.get_notes_by_creator] The current creator may have been banned by xhs, so they cannot access the data.")
|
f"[WeiboClient.get_notes_by_creator] The current creator may have been banned by xhs, so they cannot access the data.")
|
||||||
break
|
break
|
||||||
|
|
||||||
notes_has_more = notes_res.get("cardlistInfo", {}).get("total", 0) > crawler_total_count
|
|
||||||
since_id = notes_res.get("cardlistInfo", {}).get("since_id", "0")
|
since_id = notes_res.get("cardlistInfo", {}).get("since_id", "0")
|
||||||
crawler_total_count += 10
|
|
||||||
if "cards" not in notes_res:
|
if "cards" not in notes_res:
|
||||||
utils.logger.info(
|
utils.logger.info(
|
||||||
f"[WeiboClient.get_all_notes_by_creator] No 'notes' key found in response: {notes_res}")
|
f"[WeiboClient.get_all_notes_by_creator] No 'notes' key found in response: {notes_res}")
|
||||||
@ -370,5 +367,7 @@ class WeiboClient:
|
|||||||
await callback(notes)
|
await callback(notes)
|
||||||
await asyncio.sleep(crawl_interval)
|
await asyncio.sleep(crawl_interval)
|
||||||
result.extend(notes)
|
result.extend(notes)
|
||||||
|
crawler_total_count += 10
|
||||||
|
notes_has_more = notes_res.get("cardlistInfo", {}).get("total", 0) > crawler_total_count
|
||||||
return result
|
return result
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user