
Commit e05fad3

Author: namrun

Added scripts to scrape questions from Project Euler

1 parent 6d59af5 commit e05fad3

File tree

5 files changed: +88 -0 lines changed
Lines changed: 29 additions & 0 deletions
# Project Euler #

![Image](./images/euler_home.PNG)

Project Euler is a series of challenging mathematical/computer programming problems that require more than just mathematical insight to solve.

This Python script scrapes all 700+ questions across 15 archive pages and writes them into a CSV file named Project_Euler.csv.
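
The CSV side is plain `csv.writer` usage; a minimal sketch of the header row the script below writes:

```python
import csv

with open('Project_Euler.csv', 'w', newline='') as file:
    writer = csv.writer(file)
    # One header row, then one row per scraped question.
    writer.writerow(["Problem Number", "Name", "Description"])
```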

Beautiful Soup is used to scrape the URL: https://projecteuler.net/archives
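
A minimal sketch of fetching and parsing one archive page (assuming `requests` and `beautifulsoup4` are installed); the full script below loops over all 15 pages the same way:

```python
import requests
from bs4 import BeautifulSoup

# The page number is appended to the archives URL.
page_url = "https://projecteuler.net/archives;page=1"
response = requests.get(page_url)
soup = BeautifulSoup(response.text, "html.parser")
print(soup.title.string)
```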

Regular expressions are also used to extract the plain-text description of each question.
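
The tag stripping itself is a one-line substitution; this is the same pattern the script below applies to each piece of a problem description:

```python
import re

html = "<p>Find the sum of all the multiples of 3 or 5 below 1000.</p>"
# Replace every tag with a space, keeping only the text between tags.
text = re.sub(r'<.*?>', ' ', html).strip()
print(text)  # Find the sum of all the multiples of 3 or 5 below 1000.
```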

## Implementation ##

Using **inspect element** (Ctrl+Shift+I), the structure of the page can be examined.

The structure of each page is as shown:

![Image](./images/euler_questions.PNG)

Each `<tr>` element in the problems table holds one question's entry; the link to the question itself sits in an `<a>` tag.
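
Concretely, the script locates the table by its id and walks the `<a>` tags inside it; a trimmed sketch of that lookup:

```python
import requests
from bs4 import BeautifulSoup

url = "https://projecteuler.net/archives"
soup = BeautifulSoup(requests.get(url).text, "html.parser")

# Each <a> inside the problems table links to one problem page,
# with an href of the form "problem=N".
for link in soup.find('table', attrs={"id": "problems_table"}).find_all('a'):
    print(link['href'].split('=')[-1], link.string)
```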

Each question has the following components:

![Image](./images/question1.PNG)

The contents are parsed and stored using Beautiful Soup, a library built for web scraping.
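
On each question page, the description lives in a `<div class="problem_content">` element; this sketch shows how the script below collects it for a single problem:

```python
import re
import requests
from bs4 import BeautifulSoup

url = "https://projecteuler.net/problem=1"
page = BeautifulSoup(requests.get(url).text, "html.parser")

# Concatenate the tag-stripped text of every child of the content div.
description = ''
for content in page.find("div", attrs={"class": "problem_content"}).children:
    description += re.sub(r'<.*?>', ' ', str(content))
print(description.strip())
```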
Lines changed: 59 additions & 0 deletions
#!/usr/bin/env python3

# Imports and dependencies
import requests
from bs4 import BeautifulSoup
import re
import csv

def Euler():

    # The contents are written into a CSV file.
    # Each question has a serial number, the name of the problem and the description of the problem.

    with open('Project_Euler.csv', 'w', newline='') as file:
        writer = csv.writer(file)
        writer.writerow(["Problem Number", "Name", "Description"])

        # There are 15 pages in all; the page number is appended to the URL.
        start = 1
        pages = 15

        for page in range(start, pages + start):

            # Fetch each archive page, then search it for questions.
            page_url = "https://projecteuler.net/archives;page=" + str(page)
            response = requests.get(page_url)
            soup = BeautifulSoup(response.text, "html.parser")

            # All the questions are located within the <table> tag.
            # This can be confirmed with inspect element, Ctrl+Shift+I.

            for link in soup.find('table', attrs={"id": "problems_table"}).find_all('a'):

                # The link to the question is located in an <a> tag.
                question_url = "https://projecteuler.net/" + link['href']

                # The question number and name are obtained from the link's href and text.
                question_number = link['href'].split('=')[-1]
                question_name = link.string

                ques_response = requests.get(question_url)
                ques_contents = BeautifulSoup(ques_response.text, "html.parser")
                description = ''

                # On each question page, the description sits in the
                # <div class="problem_content"> element.
                for content in ques_contents.find("div", attrs={"class": "problem_content"}).children:

                    # Strip the tags, keeping only the text between them.
                    content = re.sub(r'<.*?>', r' ', str(content))
                    description += content

                # Each entry is written into the file.
                writer.writerow([question_number, question_name, description])

Euler()