-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathwebscrape.py
33 lines (21 loc) · 845 Bytes
/
webscrape.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
import os
from bs4 import BeautifulSoup
import requests
# Base address of the section being scraped; each page name in
# ``listoflinks`` is appended to it to form the URL that is fetched.
url = 'https://www.scotiabank.com/ca/en/commercial-banking/scotia-connect-simple/'
listoflinks = ["payments.html", "administration.html",
               "reporting.html", "additional-services.html"]

# For every page: download it, visit each <div> nested inside the
# "card-content" containers, and record the text of the first <p> together
# with the href of the first <a>. Each pair is echoed to stdout and appended
# to keywords.txt.
for item in listoflinks:
    # The timeout keeps an unresponsive server from hanging the script
    # forever; requests applies no timeout unless one is given.
    res = requests.get(url + item, headers={'User-Agent': 'Mozilla/5.0'},
                       timeout=30)
    soup = BeautifulSoup(res.text, "html.parser")

    # Lines collected for this page, written in one batch after parsing.
    entries = []
    for card in soup.find_all("div", {"class": "card-content"}):
        for row in card.find_all('div'):
            paragraph = row.find('p')
            anchor = row.find("a")
            # find() returns None when the tag is absent; skip rows that do
            # not carry both a paragraph and a link instead of crashing.
            if paragraph is None or anchor is None:
                continue
            link = anchor.get('href')
            if link is None:
                # Anchor without an href attribute: nothing to record.
                continue
            details = paragraph.getText().strip()
            # writelines() inserts no separators, so terminate every value
            # explicitly to get one value per line in the output file.
            entries.append(details + "\n")
            entries.append(link + "\n")
            print(details)
            print(link)

    if entries:
        # Context manager guarantees the handle is closed even if a write
        # fails; explicit UTF-8 avoids platform-dependent encoding errors
        # on non-ASCII page text.
        with open("keywords.txt", "a", encoding="utf-8") as outfile:
            outfile.writelines(entries)