Exemplo n.º 1
0
def main():
    """Load a saved meeting page and store its description in the database.

    The page URL is read from ``sys.argv[1]``. The saved HTML is expected at
    ``$IN_THE_ROOMS_ROOT/meetings/<id>.html``, where ``<id>`` is ``_id(url)``
    (formatted with ``%d``, so it must be an integer). One row is inserted
    into the ``meeting_info`` table of ``$IN_THE_ROOMS_ROOT/intherooms.db``.

    Exits with status 1 after printing a usage line when no URL argument is
    given, and exits with the default status after printing a notice when the
    parsed document has no root element.

    Raises:
        KeyError: if the ``IN_THE_ROOMS_ROOT`` environment variable is unset.
    """
    import sys

    # Fail with a readable message instead of an IndexError on sys.argv[1].
    if len(sys.argv) < 2:
        print("USAGE: %s [meeting page url]" % sys.argv[0])
        sys.exit(1)

    url = sys.argv[1]
    root_dir = os.environ['IN_THE_ROOMS_ROOT']
    page_id = _id(url)
    filename = os.path.join(root_dir, 'meetings', '%d.html' % page_id)

    dt = dumptruck.DumpTruck(
        dbname=os.path.join(root_dir, 'intherooms.db'),
        adapt_and_convert=True,
    )

    html = lxml.html.parse(filename).getroot()
    # getroot() yields None for a document without a root element; use an
    # identity check so the element's own comparison/truthiness rules are
    # never involved.
    if html is None:
        print('%d.html is empty' % page_id)
        # sys.exit() rather than the site-provided exit(), which is not
        # guaranteed to exist (e.g. under ``python -S``).
        sys.exit()

    data = {
        'Url': url,
        'Meeting Description': meeting_info(html),
    }
    # NOTE(review): meeting_description() is defined elsewhere; it presumably
    # expands the raw description into further columns — confirm.
    data = meeting_description(data)
    dt.insert(data, 'meeting_info')
Exemplo n.º 2
0
def main():
    """Load a saved location page and store its data in the database.

    Expects exactly one command-line argument, the location page URL. The
    saved HTML is read from ``$IN_THE_ROOMS_ROOT/locations/<id>.html``, where
    ``<id>`` is ``_id(url)`` (formatted with ``%d``, so it must be an
    integer). One row is inserted into the ``location`` table of
    ``$IN_THE_ROOMS_ROOT/intherooms.db``.

    Exits with status 1 after printing a usage line when the argument count
    is wrong. Returns without inserting anything when the ``COORDS`` pattern
    does not match the page source.

    Raises:
        KeyError: if the ``IN_THE_ROOMS_ROOT`` environment variable is unset.
    """
    import sys

    if len(sys.argv) != 2:
        # sys.argv[0] is a string: '%d' would raise TypeError here and hide
        # the usage message, so format it with '%s'.
        print("USAGE: %s [location page url]" % sys.argv[0])
        # sys.exit() rather than the site-provided exit(), which is not
        # guaranteed to exist (e.g. under ``python -S``).
        sys.exit(1)

    url = sys.argv[1]
    root_dir = os.environ['IN_THE_ROOMS_ROOT']
    filename = os.path.join(root_dir, 'locations', '%d.html' % _id(url))

    dt = dumptruck.DumpTruck(
        dbname=os.path.join(root_dir, 'intherooms.db'),
        adapt_and_convert=True,
    )

    # Close the file deterministically instead of leaking the handle.
    with open(filename) as page:
        source = page.read()

    if not re.findall(COORDS, source):
        print('No coordinates were found; this page probably redirects to the home page.')
        return

    html = lxml.html.parse(filename).getroot()

    data = {
        'Url': url,
    }
    # NOTE(review): coords() and description() are defined elsewhere;
    # coords() must return a mapping (it is passed to dict.update) — confirm
    # the keys it produces against the 'location' table.
    data.update(coords(source))
    data['Location Description'] = description(html)
    dt.insert(data, 'location')