In [3]:
from bs4 import BeautifulSoup
import requests
In [6]:
# Download the "All Things Considered" program page.
# timeout: without one, requests waits indefinitely on an unresponsive server.
# raise_for_status(): fail here on a 4xx/5xx response rather than parsing an
# error page further down and ending up with an empty result.
page = requests.get('https://www.npr.org/programs/all-things-considered/', timeout=30)
page.raise_for_status()
In [10]:
# Parse the raw response body into a navigable tree using the 'html.parser' parser.
soup = BeautifulSoup(markup=page.content, features='html.parser')
In [36]:
# Collect every <article> element that carries the "rundown-segment" CSS class.
articles = soup.find_all('article', class_="rundown-segment")
In [37]:
# Sanity check: how many <article> elements the search matched.
len(articles)
Out[37]:
In [55]:
# Print the listen-link URL of every segment that has one.
for article in articles:
    audio = article.find('a', {'class': 'audio-module-listen'})
    # find() returns None when the segment has no matching <a> tag; skip those
    # (and anchors lacking an href) instead of raising mid-loop.
    if audio is None or not audio.has_attr('href'):
        continue
    audioLink = audio['href']
    # print() call form: valid on Python 3, and prints the same text on Python 2.
    print(audioLink)
In [ ]:
In [45]:
In [53]:
# NOTE(review): `audio` is not assigned in this cell; on a top-to-bottom run it
# is whatever an earlier cell last bound to that name -- confirm this is intended.
audioLink = audio['href']
In [54]:
# Display the href value currently bound to audioLink.
audioLink
Out[54]:
In [ ]: