forked from adi0509/Python
-
Notifications
You must be signed in to change notification settings - Fork 0
/
news_article.py
37 lines (27 loc) · 1.07 KB
/
news_article.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
#Description: Scrape and Summarize News Articles
#pip install nltk
#pip install newspaper3k
#Resources: Documentation: https://newspaper.readthedocs.io/en/latest/?source=post_page---------------------------
# Medium Article: https://towardsdatascience.com/scrape-and-summarize-news-articles-in-5-lines-of-python-code-175f0e5c7dfc
# Article Website: https://www.washingtonpost.com/technology/2019/07/17/you-downloaded-faceapp-heres-what-youve-just-done-your-privacy/?noredirect=on&utm_term=.f8b0b55b2805
#Import the libraries
import nltk
from newspaper import Article
# Script body: fetch one news article, run newspaper's NLP step on it, and
# print its metadata, full text, and summary.

#Get the article
url = 'https://www.washingtonpost.com/technology/2019/07/17/you-downloaded-faceapp-heres-what-youve-just-done-your-privacy/?noredirect=on&utm_term=.1938589d078f'
article = Article(url)
# download() and parse() are called before any attribute of the article is read.
article.download()
article.parse()

# Do some NLP
# The 'punkt' NLTK resource is fetched first; presumably article.nlp() relies
# on it for tokenization -- confirm against the newspaper documentation.
nltk.download('punkt')
article.nlp()

# NOTE: the three metadata values below are printed explicitly. As bare
# expressions (e.g. `article.authors`) they are evaluated and discarded when
# this file runs as a script, so nothing would be shown.

#Get the authors
print(article.authors)
#Get the publish date
print(article.publish_date)
#Get the top image
print(article.top_image)
#Get the article text
print(article.text)
#Get a summary of the article (read after article.nlp() has run)
print(article.summary)