sanscript-tech
diff --git a/‎Python/Medium-article-scrapper/Article_downloader.py
Lines changed: 36 additions & 0 deletions b/‎Python/Medium-article-scrapper/Article_downloader.py
Lines changed: 36 additions & 0 deletions
diff --git a/‎Python/Medium-article-scrapper/README.md
Lines changed: 26 additions & 0 deletions b/‎Python/Medium-article-scrapper/README.md
Lines changed: 26 additions & 0 deletions
diff --git a/‎Python/Medium-article-scrapper/assets/content.PNG
3.09 KB b/‎Python/Medium-article-scrapper/assets/content.PNG
3.09 KB
diff --git a/‎Python/Medium-article-scrapper/assets/medium.PNG
1.32 KB b/‎Python/Medium-article-scrapper/assets/medium.PNG
1.32 KB
diff --git a/‎Python/Medium-article-scrapper/assets/promptURL.PNG
3.98 KB b/‎Python/Medium-article-scrapper/assets/promptURL.PNG
3.98 KB
@@ -0,0 +1,36 @@
+#!/usr/bin/env python3
+
+#Imports and dependencies
+
+import requests
+from bs4 import BeautifulSoup
+
+#The content is written into a text file
+
+file = open("Medium_article_content.txt", "w")
+
+#The URL of the article is entered here
+page_url = input("Enter the URL of the Medium Article ")
+
+#Based on the response got from the URL, the content is loaded into response
+
+response = requests.get(page_url)
+
+#Beautiful soup is a library used for web scraping and parsing the contents of a web page
+#Here a html parser is used to parse through the content embedded in the html tags
+
+soup = BeautifulSoup(response.text,"html.parser")
+
+#The content of the article is stored in the <article> tag
+
+for line in soup.find('article').find('div'):
+  
+  #All the content is essentially stored between <p> tags
+  
+  for content in line.find_all('p'):
+
+    #contents are written into a file
+    
+    file.write(content.text + '\n')
+
+file.close()
@@ -0,0 +1,26 @@
+# Medium Article Downloader
+
+![Image](assets/medium.PNG)
+
+Medium is a treasure trove of knowledge. It is a great place to read and write blogs
+
+Through this script, the contents of a medium article can be downloaded and stored
+
+The Beautiful Soup library in Python enables web scraping by parsing through the HTML content that web pages are made of. This script uses it to extract the article text.
+
+
+## Requirements
+    - pip install requests
+    - pip install beautifulsoup4
+
+
+## Working
+The user is prompted to enter the URL of the Medium article that has to be downloaded
+
+![Image](assets/promptURL.PNG)
+
+The contents are then stored in a file named `Medium_article_content.txt`
+
+![Image](assets/content.PNG)
+
+