-
Notifications
You must be signed in to change notification settings - Fork 2
/
scraper.py
27 lines (23 loc) · 826 Bytes
/
scraper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
'''
This is a web scraper example, scraping data from a quotes site.
'''
# To start, you need two main modules:
# one to access the web address by sending HTTP requests,
# the other to parse the HTML that comes back.
import requests
from bs4 import BeautifulSoup
# url => the address we want to scrape
url = 'http://quotes.toscrape.com/'

# Bound the request so an unresponsive server cannot hang the script forever
# (requests applies no timeout by default), and fail loudly on an HTTP error
# status instead of silently parsing an error page.
response = requests.get(url, timeout=10)
response.raise_for_status()

# Parse the page and collect the elements holding each quote's text, author
# and tag list. The three searches are independent, so the results are only
# matched up by position.
soup = BeautifulSoup(response.text, 'lxml')
quotes = soup.find_all('span', class_='text')
authors = soup.find_all('small', class_='author')
tags = soup.find_all('div', class_='tags')

# Walk the three result lists in lockstep. zip() stops at the shortest list,
# so a quote lacking an author or tag block cannot raise IndexError the way
# positional indexing would.
for quote, author, tag_block in zip(quotes, authors, tags):
    print(quote.text)
    print(author.text)
    # Tags are written tab-separated on a single line (no newline after each).
    for tag in tag_block.find_all('a', class_='tag'):
        print(tag.text, end='\t')
    # Separator between quotes; it continues the tag line because the tags
    # above are printed without a trailing newline.
    print("=" * 25)