Update scrape_sources.py
Browse files - scrape_sources.py +1 -1
scrape_sources.py
CHANGED
@@ -47,7 +47,7 @@ class NPRLite(Source):
|
|
47 |
# Returns None if article is only 1 line.
|
48 |
def retrieve_article(self, indata: stub) -> Tuple[str, List[Tuple[str, Any]]]:
|
49 |
"""Retrieves article data from text.npr.org subhead if exists, date, author(s), and whole text"""
|
50 |
-
|
51 |
container = Soup(get(self.source_url[:-5] + indata.link))
|
52 |
text_container = container.find('div', {'class': "paragraphs-container"}).find('p')
|
53 |
if isinstance(text_container, Soup):
|
|
|
47 |
# Returns None if article is only 1 line.
|
48 |
def retrieve_article(self, indata: stub) -> Tuple[str, List[Tuple[str, Any]]]:
|
49 |
"""Retrieves article data from text.npr.org subhead if exists, date, author(s), and whole text"""
|
50 |
+
st.write(f"""Retrieving article from:\n\t{self.source_url[:-5] + indata.link}\n""")
|
51 |
container = Soup(get(self.source_url[:-5] + indata.link))
|
52 |
text_container = container.find('div', {'class': "paragraphs-container"}).find('p')
|
53 |
if isinstance(text_container, Soup):
|