def download_testdroid_apk(args):
    """Fetch the Testdroid APK into ``args.files`` unless it is already there.

    The destination file name is ``args.filename`` when that is truthy,
    otherwise the base name of the module-level ``testdroid_apk_url``.

    If the destination already exists and ``args.force`` is falsy, a warning
    is logged and nothing is downloaded. In every other case ``download_file``
    is called with the URL suffixed by ``?raw=true``.

    Args:
        args: object exposing ``filename``, ``files`` and ``force``
            attributes (presumably an argparse namespace -- confirm
            against the caller).
    """
    apk_name = args.filename or os.path.basename(testdroid_apk_url)
    testdroid_apk = os.path.join(args.files, apk_name)

    already_present = os.path.exists(testdroid_apk)
    if already_present and not args.force:
        logger.warning("%s exists. Skipping download." % testdroid_apk)
        return

    # The "?raw=true" query string forces a download of the file itself.
    download_file(testdroid_apk_url + "?raw=true", testdroid_apk)
Пример #2
0
 def thread_active_jobs(self):
     """Poll active runs for as long as ``self.state`` is ``"RUNNING"``.

     Each pass logs a message, calls ``self.process_active_runs()`` and then
     sleeps for ten seconds. A ``requests`` connection error is logged as
     two warnings and followed by an additional ten second sleep, so the
     next attempt happens roughly twenty seconds later. Any other exception
     propagates to the caller.
     """
     pause_seconds = 10

     while self.state == "RUNNING":
         logger.info("getting active runs")
         try:
             self.process_active_runs()
         except requests.exceptions.ConnectionError as conn_err:
             logger.warning("exception raised when calling process_active_runs.")
             logger.warning(conn_err)
             # TODO: if we see this a lot, add exponential backoff?
             time.sleep(pause_seconds)
         time.sleep(pause_seconds)
Пример #3
0
    def handle_queue(self, project_name, projects_config):
        """Keep starting test runs for one project while the state is "RUNNING".

        Every pass of the outer loop:

        1. re-reads the project's entry from ``projects_config``;
        2. while holding the project's lock from ``CACHE``, warns about
           offline/disabled devices, asks ``get_taskcluster_pending_tasks``
           for the pending task count and derives ``jobs_to_start``;
        3. outside the lock, calls ``run_test_for_project`` up to
           ``jobs_to_start`` times, bumping ``stats["WAITING"]`` after each
           successful start;
        4. sleeps ``self.wait`` seconds if the state is still "RUNNING".

        A 404 ``RequestResponseError`` whose text matches
        ``ARCHIVED_FILE_REGEX`` or ``PROJECT_DOES_NOT_EXIST_REGEX`` sets
        ``self.state`` to ``"STOP"``; other errors raised while starting a
        run are logged and the loop carries on.

        Args:
            project_name: key into both ``projects_config`` and
                ``CACHE["projects"]``.
            projects_config: mapping of project names to their settings; it
                must also contain a ``"defaults"`` entry providing
                ``"taskcluster_provisioner_id"``.
        """
        logger.info("thread starting")
        project_cache = CACHE["projects"][project_name]
        stats = project_cache["stats"]
        lock = project_cache["lock"]

        while self.state == "RUNNING":
            project_config = projects_config[project_name]
            device_group_name = project_config["device_group_name"]
            worker_type = project_config["additional_parameters"].get(
                "TC_WORKER_TYPE")

            with lock:
                if stats["OFFLINE"] or stats["DISABLED"]:
                    device_report = "{:10s} DISABLED {} OFFLINE {} {}".format(
                        device_group_name,
                        stats["DISABLED"],
                        stats["OFFLINE"],
                        ", ".join(stats["OFFLINE_DEVICES"]),
                    )
                    logger.warning(device_report)

                provisioner_id = projects_config["defaults"][
                    "taskcluster_provisioner_id"]

                try:
                    pending_tasks = get_taskcluster_pending_tasks(
                        provisioner_id, worker_type)
                except requests.ConnectionError as conn_err:
                    logger.warning(
                        "exception raised when calling get_taskcluster_pending_tasks."
                    )
                    logger.warning(conn_err)
                    pending_tasks = 0

                # Start enough runs to cover either the pending tasks or the
                # idle devices that do not already have a waiting run, plus a
                # small logarithmic fudge term -- whichever is smaller.
                # math.log10 only accepts positive arguments ("ValueError:
                # math domain error" otherwise), hence the "1 +".
                fudge = int(math.log10(1 + pending_tasks))
                device_capacity = stats["IDLE"] - stats["WAITING"] + 1 + fudge
                jobs_to_start = min(pending_tasks, device_capacity)
                if jobs_to_start < 0:
                    jobs_to_start = 0

                if stats["RUNNING"] or stats["WAITING"]:
                    summary = (
                        "COUNT {} IDLE {} OFFLINE {} DISABLED {} RUNNING {} WAITING {} PENDING {} STARTING {}"
                    ).format(
                        stats["COUNT"],
                        stats["IDLE"],
                        stats["OFFLINE"],
                        stats["DISABLED"],
                        stats["RUNNING"],
                        stats["WAITING"],
                        pending_tasks,
                        jobs_to_start,
                    )
                    logger.info(summary)

            for _ in range(jobs_to_start):
                if self.state != "RUNNING":
                    break
                try:
                    if TESTING:
                        logger.info(
                            "TESTING MODE: Would be starting test run.")
                        continue

                    # With no devices assigned the API raises when a run is
                    # started, so detect that here and only warn.
                    if stats["COUNT"] == 0:
                        logger.warning(
                            "Didn't try to start a job because there are no devices assigned."
                        )
                        continue

                    test_run = run_test_for_project(project_name)
                    # Count the new run right away so that we do not start
                    # too many before the main thread refreshes the stats.
                    with lock:
                        stats["WAITING"] += 1

                    logger.info("test run {} started".format(test_run["id"]))
                except RequestResponseError as api_err:
                    # Two specific 404 responses mean the configuration is
                    # stale; they stop the manager after being logged.
                    stop_reason = None
                    if api_err.status_code == 404:
                        error_text = str(api_err)
                        if re.search(ARCHIVED_FILE_REGEX, error_text):
                            stop_reason = (
                                "Test files have been archived. Exiting so configuration is rerun..."
                            )
                        elif re.search(PROJECT_DOES_NOT_EXIST_REGEX,
                                       error_text):
                            stop_reason = (
                                "Project does not exist!. Exiting so configuration is rerun..."
                            )

                    if stop_reason is not None:
                        logger.error(stop_reason)
                    logger.error("%s: %s" %
                                 (api_err.__class__.__name__, api_err))
                    if stop_reason is not None:
                        self.state = "STOP"
                except Exception as err:
                    logger.error(
                        "Failed to create test run for group %s (%s: %s)." %
                        (device_group_name, err.__class__.__name__, err),
                        exc_info=True,
                    )

            if self.state == "RUNNING":
                time.sleep(self.wait)

        logger.info("thread exiting")
Пример #4
0
    def run(self):
        """Start the worker threads, then refresh project stats until stopped.

        Startup:
          * ``CONFIG["threads"]`` is reset to an empty list;
          * a thread named "active_jobs" running ``thread_active_jobs`` is
            started and recorded there;
          * for every project other than "defaults" whose
            ``additional_parameters`` carry a truthy ``TC_WORKER_TYPE``, the
            stats are pre-populated via ``get_bitbar_test_stats`` and a
            ``handle_queue`` thread named after the project is started.

        Main loop (while ``self.state`` is "RUNNING"): sleep 60 seconds, then
        for every project other than "defaults" add its cached WAITING and
        RUNNING counts to the totals and refresh its stats under the
        project's lock. The totals are therefore summed from the values
        cached before each refresh. A ``requests`` connection error during a
        refresh is logged and followed by a 15 second sleep taken while the
        lock is still held.
        """
        projects_config = CONFIG["projects"]
        CONFIG["threads"] = []

        active_job_thread = threading.Thread(
            target=self.thread_active_jobs,
            name="active_jobs",
            args=(),
        )
        logger.info("test-run-manager: loading existing runs")
        active_job_thread.start()
        CONFIG["threads"].append(active_job_thread)
        time.sleep(2)

        for project_name in projects_config:
            if project_name == "defaults":
                continue

            project_config = projects_config[project_name]
            # Only manage projects initiated via Taskcluster.
            if not project_config["additional_parameters"].get(
                    "TC_WORKER_TYPE"):
                continue

            # Pre-populate the stats before the queue thread reads them.
            self.get_bitbar_test_stats(project_name, project_config)
            time.sleep(1)

            # One handle_queue thread per project.
            # TODO: should name be project_name or device group name?
            queue_thread = threading.Thread(
                target=self.handle_queue,
                name=project_name,
                args=(project_name, projects_config),
            )
            CONFIG["threads"].append(queue_thread)
            queue_thread.start()

        # The main thread has to keep running so that it can handle signals:
        # https://www.g-loaded.eu/2016/11/24/how-to-terminate-running-python-threads-using-signals/
        while self.state == "RUNNING":
            waiting_total = 0
            running_total = 0
            time.sleep(60)
            logger.info("getting stats for all projects")

            for project_name in projects_config:
                if project_name == "defaults":
                    continue

                project_cache = CACHE["projects"][project_name]
                lock = project_cache["lock"]
                stats = project_cache["stats"]
                waiting_total += stats["WAITING"]
                running_total += stats["RUNNING"]

                with lock:
                    try:
                        self.get_bitbar_test_stats(
                            project_name, projects_config[project_name])
                    except requests.exceptions.ConnectionError as conn_err:
                        logger.warning(
                            "exception raised when calling get_bitbar_test_stats."
                        )
                        logger.warning(conn_err)
                        # TODO: if we see this a lot, add exponential backoff?
                        time.sleep(15)
                time.sleep(1)

            totals_line = "WAITING_TOTAL {} RUNNING_TOTAL {}".format(
                waiting_total, running_total)
            logger.info(totals_line)

        logger.info("main thread exiting")