From 63859b11a4f50f95e141f54b8a5a5d5c27c9920b Mon Sep 17 00:00:00 2001
From: lsy2246 <lsy200546@hotmail.com>
Date: Fri, 29 Mar 2024 00:16:12 +0800
Subject: [PATCH] =?UTF-8?q?=E5=B0=8F=E8=AF=B4=E7=88=AC=E8=99=AB?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 python/spider/book/biqg.cc.py | 47 +++++++++++++++++++++++++++++++++++
 1 file changed, 47 insertions(+)
 create mode 100644 python/spider/book/biqg.cc.py

diff --git a/python/spider/book/biqg.cc.py b/python/spider/book/biqg.cc.py
new file mode 100644
index 0000000..45fee5a
--- /dev/null
+++ b/python/spider/book/biqg.cc.py
@@ -0,0 +1,47 @@
+import asyncio
+import re
+
+import aiohttp
+import aiofiles
+from bs4 import BeautifulSoup
+import os
+from concurrent.futures import ThreadPoolExecutor, ProcessPoolExecutor  # 多线程/多进程
+
+
+async def aiodownload(url):
+    if not os.path.exists("xs"):
+        os.mkdir("xs")
+    async with aiohttp.ClientSession() as session:
+        async with session.get(url) as response:
+            html = BeautifulSoup(await response.read(), "html.parser")
+            title = html.find("h1", class_="wap_none").text
+            content = html.find("div", id="chaptercontent").text
+            if os.name == 'posix':
+                name = "xs\\" + title.split(" ")[0] + ".txt"
+            elif os.name == 'nt':
+                name = "xs/" + title.split(" ")[0] + ".txt"
+            content = content.replace("　　", "\n").replace(
+                "请收藏本站：https://www.biqg.cc。笔趣阁手机版：https://m.biqg.cc ", "").replace("『点此报错』『加入书签』",
+                                                                                              "")
+            async with aiofiles.open(name, "a+") as file:
+                await file.write(content)
+
+    print(title, "成功下载")
+
+
+async def main(urls):
+    takes = []
+    for url in urls:
+        take = asyncio.create_task(aiodownload(url))
+        takes.append(take)
+    await asyncio.wait(takes)
+
+
+if __name__ == "__main__":
+    urls = []
+    for index in range(1, 2):
+        url = f"https://www.biqg.cc/book/3670/{index}.html"
+        urls.append(url)
+    asyncio.run(main(urls=urls))
+    print("全部下载完成")
+