Initial commit

This commit is contained in:
Renne Rocha 2023-10-23 19:57:49 -03:00
commit b0b016a4d9
37 changed files with 2447 additions and 0 deletions

22
code/exercise-1.py Normal file
View file

@ -0,0 +1,22 @@
# Exercise 1
# Target: https://quotes.toscrape.com/
# On this page, you will find a collection of quotes along with their respective
# authors. Each quote is accompanied by a link that directs you to a dedicated
# page providing additional details about the author, the quote itself, and a list of associated tags.
# Your task is to extract all of this information and export it into a JSON lines file.
# TIP: your parse method can be used to yield items or schedule new requests for later processing.
import scrapy
class QuotesSpider(scrapy.Spider):
name = "quotes"
allowed_domains = ["quotes.toscrape.com"]
start_urls = ["https://quotes.toscrape.com"]
def parse(self, response):
# TODO
...