import AdvancedHTMLParser
# Scans a locally saved HTML page (bundestag.html, expected to be a copy of
# https://www.bundestag.de/bundestag/plenum/abstimmung/2016) for links to vote results in .xls format.
# TODO: evaluate the linked results and store them in a database.
# Parse the HTML file "bundestag.html"; the path is resolved relative to the
# current working directory.
parser = AdvancedHTMLParser.AdvancedHTMLParser()
parser.parseFile("bundestag.html")

# Collect every element carrying the CSS class "linkGeneric" and print the
# href of each one that points at an .xls file, one per line.
links = parser.getElementsByClassName("linkGeneric")
for link in links:
    href = link.getAttribute("href")
    # Elements without an href attribute yield no value; skip them instead of
    # failing on .endswith().
    if href and href.endswith(".xls"):
        # A parenthesized single-argument print produces the same output on
        # Python 2 and Python 3.
        print(href)