def read_in_sessions(): sessions = defaultdict(list) db = connect_db() select_cursor = db.execute("SELECT session_id, query_id, template FROM templated_sessions ORDER BY session_id") for (session_id, query_id, template) in select_cursor.fetchall(): time_cursor = db.execute("SELECT time FROM queries WHERE id=?", [query_id]) time = float(time_cursor.fetchall()[0][0]) template = ParseTreeNode.from_dict(json.loads(template)) sessions[session_id].append((time, query_id, template)) db.close() return sessions
def main(): db = connect_db() cursor = db.execute("select count(distinct users.name) as cnt, template from templates, users, queries where templates.query_id = queries.id and queries.user_id = users.id group by template order by cnt desc") data = cursor.fetchall() for (cnt, template) in data: d = json.loads(template) template = ParseTreeNode.from_dict(d) template.print_tree() print "count: ", cnt print "" print "" db.close()
def read_data(): with open('/Users/salspaugh/queryexplorer/data/top_templates.csv') as file: data = [] first = True for line in file.readlines(): parts = line.split(',') if first: first = False continue cnt = int(parts[0]) jsonified_tree = ','.join(parts[1:]) d = json.loads(jsonified_tree) template = ParseTreeNode.from_dict(d) data.append((cnt, template)) return data