Initial commit

2023-10-23 19:57:49 -03:00 · 2023-10-23 19:57:49 -03:00 · b0b016a4d9
commit b0b016a4d9
37 changed files with 2447 additions and 0 deletions
--- a/code/exercise-1.py
+++ b/code/exercise-1.py
@ -0,0 +1,22 @@
+# Exercise 1
+
+# Target: https://quotes.toscrape.com/
+
+# On this page, you will find a collection of quotes. Each entry shows the quote
+# itself, its author, and a list of associated tags, along with a link that
+# directs you to a dedicated page providing additional details about the author.
+
+# Your task is to extract all of this information and export it into a JSON lines file.
+
+# TIP: your parse method can be used to yield items or schedule new requests for later processing.
+import scrapy
+
+
+class QuotesSpider(scrapy.Spider):  # Exercise 1 skeleton: parse() is intentionally left unimplemented.
+    name = "quotes"
+    allowed_domains = ["quotes.toscrape.com"]  # host of the exercise target
+    start_urls = ["https://quotes.toscrape.com"]  # the exercise target named in the header comment
+
+    def parse(self, response):
+        # TODO: extract the quote data described in the header; yield items or schedule new requests here.
+        ...