def main():
    """Store the description of one saved meeting page in the database.

    The meeting page URL is read from the first command-line argument.
    The page itself is not downloaded here: it is loaded from
    ``$IN_THE_ROOMS_ROOT/meetings/<id>.html``, where ``<id>`` is whatever
    ``_id(url)`` returns. The resulting row is inserted into the
    ``meeting_info`` table of ``$IN_THE_ROOMS_ROOT/intherooms.db``.

    Exits with status 1 (after printing a usage line) when no URL is given,
    and exits with the default status when the saved page parses to nothing.

    Raises:
        KeyError: if the ``IN_THE_ROOMS_ROOT`` environment variable is unset.
    """
    import sys

    # Fail with a readable usage line instead of an IndexError when the URL
    # is missing. Extra arguments are still tolerated, as before.
    if len(sys.argv) < 2:
        print("USAGE: %s [meeting page url]" % sys.argv[0])
        sys.exit(1)

    url = sys.argv[1]
    root = os.environ['IN_THE_ROOMS_ROOT']
    page_id = _id(url)
    filename = os.path.join(root, 'meetings', '%d.html' % page_id)

    dt = dumptruck.DumpTruck(
        dbname=os.path.join(root, 'intherooms.db'),
        adapt_and_convert=True,
    )

    html = lxml.html.parse(filename).getroot()
    # Identity comparison is the reliable way to test for a missing root.
    if html is None:
        print('%d.html is empty' % page_id)
        sys.exit()

    data = {
        'Url': url,
        'Meeting Description': meeting_info(html),
    }
    # meeting_description() receives the row and returns the row to store;
    # presumably it expands the description into more columns -- TODO confirm.
    data = meeting_description(data)
    dt.insert(data, 'meeting_info')
def main():
    """Store the coordinates and description of one saved location page.

    The location page URL is the single command-line argument. The page is
    loaded from ``$IN_THE_ROOMS_ROOT/locations/<id>.html``, where ``<id>``
    is whatever ``_id(url)`` returns. The resulting row is inserted into the
    ``location`` table of ``$IN_THE_ROOMS_ROOT/intherooms.db``.

    Exits with status 1 (after printing a usage line) unless exactly one
    argument is given. Returns without writing anything when the page text
    does not match ``COORDS``.

    Raises:
        KeyError: if the ``IN_THE_ROOMS_ROOT`` environment variable is unset.
    """
    import sys

    if len(sys.argv) != 2:
        # %s, not %d: the program name is a string, so %d raised TypeError
        # and the usage message was never shown.
        print("USAGE: %s [location page url]" % sys.argv[0])
        sys.exit(1)

    url = sys.argv[1]
    root = os.environ['IN_THE_ROOMS_ROOT']
    filename = os.path.join(root, 'locations', '%d.html' % _id(url))

    dt = dumptruck.DumpTruck(
        dbname=os.path.join(root, 'intherooms.db'),
        adapt_and_convert=True,
    )

    # Read the raw text with a context manager so the handle is closed.
    with open(filename) as page:
        source = page.read()

    # Only the existence of a match matters here.
    if not re.search(COORDS, source):
        print('No coordinates were found; this page probably redirects to the home page.')
        return

    html = lxml.html.parse(filename).getroot()

    data = {
        'Url': url,
    }
    # coords() is handed the raw page text, description() the parsed tree.
    data.update(coords(source))
    data['Location Description'] = description(html)
    dt.insert(data, 'location')