In [159]:
from urllib.request import urlopen
from bs4 import BeautifulSoup
import pandas as pd
# Fetch the upcoming-auctions page and parse it.  The context manager closes
# the HTTP response as soon as BeautifulSoup has consumed it, and the timeout
# keeps a stalled server from hanging the session indefinitely.
with urlopen("http://www.rosensys.com/upcoming-auctions", timeout=30) as html:
    soup = BeautifulSoup(html, "lxml")

# get elements
# Each attribute lookup below (soup.table, soup.h4, soup.h5, soup.find) returns
# only the FIRST matching element in the document, so these values describe a
# single entry on the page.  Any missing element raises (AttributeError,
# TypeError or IndexError) rather than being skipped.
rstable = soup.table.tr  # first <tr> of the first <table>
name = soup.h4.text
type1 = soup.h5.text
rstype = type1.replace("\n", "")

# Collect the row's cells once instead of re-scanning the row for every cell.
cells = rstable.find_all('td')
td1 = cells[1]
td2 = cells[2]
td3 = cells[3].a  # the <a> inside the fourth cell carries the link
ulink = td3['href']

# Text of the first "date-display-single" span, with commas removed and then
# split on " - ".
# NOTE(review): presumably this yields [start, end] of the sale -- confirm
# against the live markup.
sdate1 = soup.find("span", {"class": "date-display-single"}).text
sdate2 = sdate1.replace(",", "")
sdate = sdate2.split(" - ")

# Whatever remains of the link after removing the fixed URL prefix.  This does
# not depend on the loop over <h4> elements, so it is computed exactly once.
aid = ulink.replace("https://www.maxanet.com/cgi-bin/mndetails.cgi?rosen", "")

# Text of every <h4> element on the page.
ulist = [item.text for item in soup.find_all('h4')]
# NOTE(review): the loop's original indentation was lost; printing the finished
# list once is assumed to be the intent -- confirm.
print(ulist)
In [ ]: