@@ -1,30 +1,29 @@
import scrapy
-
from get_cartoon.items import MhgChapterItem

-domain = 'https://www.manhuagui.com'
+domain = "https://www.manhuagui.com"


class ManhuaguiSpider(scrapy.Spider):
    name = "manhuagui"
    custom_settings = {
        "TWISTED_REACTOR": "twisted.internet.asyncioreactor.AsyncioSelectorReactor",
-        'CONCURRENT_REQUESTS': 4,
-        'DOWNLOAD_DELAY': 3,
-        'COOKIES_ENABLED': False,
-        'PLAYWRIGHT_BROWSER_TYPE': 'chromium',
+        "CONCURRENT_REQUESTS": 4,
+        "DOWNLOAD_DELAY": 3,
+        "COOKIES_ENABLED": False,
+        "PLAYWRIGHT_BROWSER_TYPE": "chromium",
        "DOWNLOAD_HANDLERS": {
            "https": "scrapy_playwright.handler.ScrapyPlaywrightDownloadHandler",
        },
        "PLAYWRIGHT_LAUNCH_OPTIONS": {
            "headless": True,
            "timeout": 15 * 1000,  # 15 seconds
-        }
+        },
    }

    def __init__(self, **kwargs):
-        self.allowed_domains = ['manhuagui.com']
-        self.start_urls = ['https://www.manhuagui.com/comic/22265/']
+        self.allowed_domains = ["manhuagui.com"]
+        self.start_urls = ["https://www.manhuagui.com/comic/22265/"]
        super().__init__(**kwargs)

    def start_requests(self):
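
The spider fills one `MhgChapterItem` per chapter. The item class itself is outside this diff; a minimal sketch of what `get_cartoon/items.py` would have to declare for the assignments in the next hunk to work (field names are taken from the keys the spider uses; everything else is assumed):

    import scrapy


    class MhgChapterItem(scrapy.Item):
        name = scrapy.Field()             # chapter title, from the link's @title
        url = scrapy.Field()              # relative chapter URL, from @href
        page_number = scrapy.Field()      # page count, e.g. "32p" with the "p" stripped
        web_image_items = scrapy.Field()  # dict of {page number: image path}
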
@@ -41,42 +40,51 @@ def parse(self, response):
        chapter_items = []
        for chapters_selector in chapters_selectors:
            chapter_item = MhgChapterItem()
-            chapter_item['name'] = chapters_selector.xpath('a[1]/@title').extract_first()
-            chapter_item['url'] = chapters_selector.xpath('a[1]/@href').extract_first()
-            chapter_item['page_number'] = chapters_selector.xpath('a[1]/span/i/text()').extract_first().removesuffix(
-                'p')
-            chapter_item['web_image_items'] = {}
+            chapter_item["name"] = chapters_selector.xpath(
+                "a[1]/@title"
+            ).extract_first()
+            chapter_item["url"] = chapters_selector.xpath("a[1]/@href").extract_first()
+            chapter_item["page_number"] = (
+                chapters_selector.xpath("a[1]/span/i/text()")
+                .extract_first()
+                .removesuffix("p")
+            )
+            chapter_item["web_image_items"] = {}
            chapter_items.append(chapter_item)

        for chapter_item in chapter_items:
-            yield scrapy.Request(url=f'{domain}/{chapter_item["url"]}',
-                                 meta={'item': chapter_item},
-                                 callback=self.parse_every_chapter_pages)
+            yield scrapy.Request(
+                url=f'{domain}/{chapter_item["url"]}',
+                meta={"item": chapter_item},
+                callback=self.parse_every_chapter_pages,
+            )

    def parse_every_chapter_pages(self, response):
-        chapter_item = response.meta['item']
-        pages = int(chapter_item['page_number'])
+        chapter_item = response.meta["item"]
+        pages = int(chapter_item["page_number"])
        for page in range(1, pages, 1):
            page_url = f'{domain}/{chapter_item["url"]}#p={str(page)}'
-            yield scrapy.Request(url=page_url,
-                                 meta=dict(
-                                     item=chapter_item,
-                                     current_page=page,
-                                     playwright=True,
-                                     playwright_include_page=True
-                                 ),
-                                 callback=self.parse_image_url,
-                                 dont_filter=True,
-                                 errback=self.errback_close_page)
+            yield scrapy.Request(
+                url=page_url,
+                meta=dict(
+                    item=chapter_item,
+                    current_page=page,
+                    playwright=True,
+                    playwright_include_page=True,
+                ),
+                callback=self.parse_image_url,
+                dont_filter=True,
+                errback=self.errback_close_page,
+            )

    async def parse_image_url(self, response):
        web_page = response.meta["playwright_page"]
        await web_page.close()
        current_page_number = response.meta["current_page"]
        image_path = response.xpath('//*[@id="mangaFile"]/@src').extract_first()
-        chapter_item = response.meta['item']
+        chapter_item = response.meta["item"]
        # {page number: image path}
-        chapter_item['web_image_items'].update({current_page_number: image_path})
+        chapter_item["web_image_items"].update({current_page_number: image_path})
        yield chapter_item

    async def errback_close_page(self, failure):
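
The diff ends at the `errback_close_page` signature, so its body is not shown. Since the page requests set `playwright_include_page=True`, the errback is the conventional place to close the Playwright page when a request fails; a minimal sketch following the usual scrapy-playwright pattern, not necessarily the author's actual body:

    async def errback_close_page(self, failure):
        # The failed request still carries its Playwright page; close it so
        # browser pages are not leaked on download errors.
        page = failure.request.meta["playwright_page"]
        await page.close()

One caveat in the unchanged context above: `range(1, pages, 1)` stops at `pages - 1`, so the last page of each chapter is never requested; `range(1, pages + 1)` would cover the whole chapter.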
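Assuming a standard Scrapy project named `get_cartoon` (implied by the import at the top), the spider would be run from the project root, with Playwright's Chromium installed once beforehand:

    playwright install chromium
    scrapy crawl manhuagui -o chapters.json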