def scheduler(): while True: for node in Node.query.filter_by(enabled=True, mode="normal").all(): # Fetch the status of this node. status = node_status(node.url) if not status: log.debug("Error retrieving status of node %s", node.name) time.sleep(settings.interval) continue # Check whether this node still has enough samples to work with. if status["tasks"]["pending"] >= settings.threshold: continue # Schedule new samples for this node. q = Task.query.filter_by(status=Task.PENDING) tasks = q.limit(settings.threshold).all() for task in tasks: task.status = Task.ASSIGNED task.node_id = node.id if tasks: log.debug("Assigned %d tasks to %s", len(tasks), node.name) db.session.commit() time.sleep(10)
def handle_node(instance): node = Node.query.filter_by(name=instance).first() if not node: log.critical("Node not found: %s", instance) return while True: # Fetch the status of this node. status = node_status(node.url) if not status: log.debug("Error retrieving status of node %s", node.name) time.sleep(settings.interval) continue # Include the timestamp of when we retrieved this status. status["timestamp"] = int(time.time()) # Add this node status to the database for monitoring purposes. ns = NodeStatus(node.name, datetime.datetime.now(), status) db.session.add(ns) db.session.commit() # Submission of new tasks. if status["tasks"]["pending"] < settings.threshold: q = Task.query.filter_by(node_id=node.id, status=Task.ASSIGNED) q = q.order_by(Task.priority.desc(), Task.id) tasks = q.limit(settings.threshold).all() for t in tasks: t.task_id = submit_task(node.url, t.to_dict()) t.status = Task.PROCESSING t.delegated = datetime.datetime.now() log.debug("Submitted %d tasks to %s", len(tasks), node.name) db.session.commit() # Fetching of reports. tasks = fetch_tasks(node.url, status="reported") for task in tasks[:settings.threshold]: # In the case that a Cuckoo node has been reset over time it's # possible that there are multiple combinations of # node-id/task-id, in this case we take the last one available. # (This makes it possible to re-setup a Cuckoo node). q = Task.query.filter_by(node_id=node.id, task_id=task["id"]) t = q.order_by(Task.id.desc()).first() if t is None: log.debug("Node %s task #%d has not been submitted " "by us!", instance, task["id"]) # Should we delete this task? Improve through the usage of # the "owner" parameter. delete_task(node.url, task["id"]) continue dirpath = os.path.join(settings.reports_directory, "%d" % t.id) if not os.path.isdir(dirpath): os.makedirs(dirpath) # Fetch each report. for report_format in settings.report_formats: try: store_report(node.url, t.task_id, report_format, dirpath) except InvalidReport as e: log.critical("Error fetching report: %s", e) # Fetch the pcap file. if settings.pcap: pcap_path = os.path.join(dirpath, "dump.pcap") fetch_pcap(node.url, t.task_id, pcap_path) # Delete the task and all its associated files from the # Cuckoo node. delete_task(node.url, t.task_id) t.status = Task.FINISHED t.started = datetime.datetime.strptime(task["started_on"], "%Y-%m-%d %H:%M:%S") t.completed = datetime.datetime.now() log.debug("Fetched %d reports from %s", len(tasks), node.name) db.session.commit() time.sleep(settings.interval)