示例#1
0
def main_sqlite():
    """Parse one saved search-results page and upsert its rows into SQLite.

    The directory name and page number come from ``search_args()``. The
    page is read from
    ``$IN_THE_ROOMS_ROOT/searches-usa/<dirname>/<n>.html``, turned into
    rows by ``table_data()``, annotated with the search coordinates and
    page number, and upserted into the ``meeting_search`` table of
    ``$IN_THE_ROOMS_ROOT/intherooms.db``.

    Raises:
        KeyError: if the ``IN_THE_ROOMS_ROOT`` environment variable is unset.
        ValueError: if there is at least one row and ``dirname`` does not
            split on ``,`` into exactly two parts.
    """
    import os
    import dumptruck
    import lxml.html

    root_dir = os.environ['IN_THE_ROOMS_ROOT']
    db_path = os.path.join(root_dir, 'intherooms.db')
    dt = dumptruck.DumpTruck(dbname=db_path, adapt_and_convert=True)

    dirname, n = search_args()
    page_path = os.path.join(root_dir, 'searches-usa', dirname, '%d.html' % n)
    document = lxml.html.parse(page_path)
    data = table_data(document.getroot())

    for row in data:
        # dirname is presumably a "longitude,latitude" pair -- confirm
        # against whatever produces the searches-usa directory names.
        longitude, latitude = dirname.split(',')
        row['Search Longitude'] = longitude
        row['Search Latitude'] = latitude
        row['Search Page'] = n

    dt.upsert(data, 'meeting_search')
    print('Parsed (%s) page %d' % (dirname, n))
示例#2
0
def main_json():
    """Fetch one search-results page and print its table rows as JSON.

    The arguments returned by ``search_args()`` are passed to ``page()``
    to obtain the location handed to ``lxml.html.parse``. The parsed
    document's root element is given to ``table_data()``, and the result
    is written to standard output as a single JSON document.
    """
    import json
    # Imported locally, as main_sqlite does, so this entry point does not
    # rely on a module-level import of lxml.html being present.
    import lxml.html

    url = page(*search_args())
    # parse() returns an ElementTree; pass table_data the root element,
    # which is the same kind of object main_sqlite hands to it.
    html = lxml.html.parse(url).getroot()
    data = table_data(html)
    print(json.dumps(data))