-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathScrapeSymbols.py
41 lines (30 loc) · 1.3 KB
/
ScrapeSymbols.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# importing the libraries
from bs4 import BeautifulSoup
import requests
import csv
# only re-run this when you want to refresh the list of tickers
headings = []
for page in range(1, 7):
url="https://www.londonstockexchange.com/indices/ftse-aim-100-index/constituents/table?page="+str(page)
html_content = requests.get(url).text
soup = BeautifulSoup(html_content, "lxml")
symbolTable = soup.find("table", attrs={"class": "full-width ftse-index-table-table"})
symbolTableData = symbolTable.tbody.find_all("tr") # contains 2 rows
rowData = ""
for row in symbolTableData:
first = True
for element in row.find_all("td"):
if first:
rowData = (element.text).replace(',', '') # strip commas from numbers
rowData += '.L' # DISABLE THIS LINE, IF NOT LSE STOCK SYMBOLS
first = False
else:
rowData = rowData + "," + (element.text).replace(',', '') # strip commas from numbers
break # uncomment if you don't just want the first 2 columns
headings.append(rowData)
rowData = ""
#print(headings)
with open('datasets/symbols.csv','w',newline='\n') as file:
# Upload as open project on Github
for heading in sorted(headings):
file.write(heading+"\n")