def _generate():
    """Yield one UTF-8 encoded value per row of the "merkmaleVerzeichnis" listing.

    Rows come from ``scrape.read_table_pages`` for the URL built by
    ``config.url("?operation=merkmaleVerzeichnis")``.  For every row the
    first ``<td>`` is inspected:

    * if the cell has a direct string, that string is yielded;
    * otherwise the ``id`` attribute of the anchor inside the cell is
      yielded.

    Rows without a ``<td>``, and cells that provide neither a string nor
    an anchor ``id``, are skipped instead of raising ``AttributeError``.
    """
    listing_url = config.url("?operation=merkmaleVerzeichnis")
    for tr in scrape.read_table_pages(listing_url):
        td = tr.find('td')
        if not td:
            # Rows without a data cell carry nothing to yield.
            continue

        if td.string:
            yield td.string.encode('utf-8')
            continue

        # No direct text: fall back to the id of the link inside the cell.
        anchor = td.find('a')
        anchor_id = anchor.get('id') if anchor is not None else None
        if anchor_id is None:
            # Neither text nor a usable anchor id: skip the row rather
            # than crash on ``None``.
            continue
        yield anchor_id.encode('utf-8')
def _generate():
    """Yield one UTF-8 encoded value per row of the "merkmaleVerzeichnis" listing.

    The rows are produced by ``scrape.read_table_pages`` for the URL
    returned by ``config.url("?operation=merkmaleVerzeichnis")``.  Only the
    first ``<td>`` of each row is used: its direct string when it has one,
    otherwise the ``id`` attribute of the anchor it contains.

    A row is skipped when it has no ``<td>``, or when its cell offers
    neither a string nor an anchor with an ``id`` (previously the latter
    case raised ``AttributeError`` on ``None``).
    """
    listing_url = config.url("?operation=merkmaleVerzeichnis")
    for tr in scrape.read_table_pages(listing_url):
        td = tr.find('td')
        if not td:
            # Nothing to extract from a row without a data cell.
            continue

        text = td.string
        if text:
            yield text.encode('utf-8')
            continue

        # The cell has no direct text; use the id of its link instead.
        anchor = td.find('a')
        if anchor is None:
            continue
        anchor_id = anchor.get('id')
        if anchor_id is None:
            continue
        yield anchor_id.encode('utf-8')
def load_variable_tables(href):
    """Yield the ``id`` attribute of the anchor found in each table row.

    ``href`` is passed unchanged to ``scrape.read_table_pages``; one value
    is yielded per row it produces.
    """
    rows = scrape.read_table_pages(href)
    for row in rows:
        anchor = row.find('a')
        yield anchor.get('id')
def terms_it():
    """Yield the ``id`` of the first anchor in each "begriffeVerzeichnis" row.

    Rows are read via ``scrape.read_table_pages`` from the URL built by
    ``config.url("?operation=begriffeVerzeichnis")``.
    """
    listing_url = config.url("?operation=begriffeVerzeichnis")
    for row in scrape.read_table_pages(listing_url):
        anchors = row.findAll("a")
        first_anchor = anchors[0]
        yield first_anchor.get("id")
def load_variables(stat_id):
    """Yield the first child of the ``<div>`` in each row's first ``<td>``.

    ``stat_id`` is interpolated into the "statistikMerkmale" query string
    as the ``selectionname`` parameter; the resulting URL is read with
    ``scrape.read_table_pages``.  Rows without a ``<td>`` are skipped.
    """
    query = "?sequenz=statistikMerkmale&selectionname=%s&sprache=de" % stat_id
    url = config.url(query)
    for row in scrape.read_table_pages(url):
        cell = row.find('td')
        if not cell:
            continue
        div = cell.find('div')
        yield div.contents[0]