Final version
This commit is contained in:
parent
d7fd3dd578
commit
63e275fa2f
30 changed files with 2918 additions and 5 deletions
27
code/playwright-disabled.py
Normal file
27
code/playwright-disabled.py
Normal file
|
@@ -0,0 +1,27 @@
|
|||
import scrapy
|
||||
|
||||
|
||||
class QuotesPlaywrightSpider(scrapy.Spider):
    """Download the JavaScript quotes page with Playwright turned off.

    The spider installs the scrapy-playwright download handler for both
    ``http`` and ``https`` but issues its single request with
    ``meta["playwright"] = False``. The response body is saved to
    ``playwright-disabled.html`` in the current working directory.

    NOTE(review): per the scrapy-playwright documentation, a request whose
    ``playwright`` meta key is falsy should bypass the browser, so the saved
    HTML is presumably the page *before* any JavaScript ran -- confirm
    against the installed scrapy-playwright version.
    """

    name = "quotes-playwright"

    custom_settings = {
        # Send both URL schemes through the scrapy-playwright handler.
        "DOWNLOAD_HANDLERS": {
            "http": "scrapy_playwright.handler.ScrapyPlaywrightDownloadHandler",
            "https": "scrapy_playwright.handler.ScrapyPlaywrightDownloadHandler",
        },
        # Use the asyncio-based Twisted reactor.
        "TWISTED_REACTOR": "twisted.internet.asyncioreactor.AsyncioSelectorReactor",
        "PLAYWRIGHT_LAUNCH_OPTIONS": {
            "headless": True,
        },
    }

    def start_requests(self):
        """Yield the single request for the JavaScript quotes page.

        Yields:
            scrapy.Request: request for ``http://quotes.toscrape.com/js/``
            with the ``playwright`` meta key explicitly set to ``False``.
        """
        yield scrapy.Request(
            url="http://quotes.toscrape.com/js/",
            meta={
                "playwright": False,
            },
        )

    async def parse(self, response):
        """Write the response text to ``playwright-disabled.html``.

        Args:
            response: the downloaded response; only ``response.text`` is read.
        """
        # Pin the encoding explicitly: ``response.text`` is Unicode, and the
        # platform default encoding may be unable to represent every
        # character in it (raising UnicodeEncodeError on some locales).
        with open("playwright-disabled.html", "w", encoding="utf-8") as content:
            content.write(response.text)
|
Loading…
Add table
Add a link
Reference in a new issue