diff --git a/crawler.py b/crawler.py index c535463..793af48 100644 --- a/crawler.py +++ b/crawler.py @@ -1,5 +1,8 @@ import AdvancedHTMLParser +# Crawls https://www.bundestag.de/bundestag/plenum/abstimmung/2016 for vote results in XLS format. +# TODO: evaluate the results and store them in a database. + parser = AdvancedHTMLParser.AdvancedHTMLParser(); parser.parseFile("bundestag.html")