Exemple #1
0
def stream_logs(experiment):
    """Stream the logs of the experiment's master pod.

    The pod name is built for the master task at index 0 from the
    experiment's uuid, and the call is delegated to ``base.stream_logs``;
    its result is returned unchanged.
    """
    name_fields = {
        'task_type': TaskType.MASTER,  # only the master task is targeted
        'task_idx': 0,
        'experiment_uuid': experiment.uuid.hex,
    }
    master_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    manager = K8SManager(namespace=settings.K8S_NAMESPACE, in_cluster=True)
    return base.stream_logs(k8s_manager=manager,
                            pod_id=master_pod,
                            container_job_name=settings.CONTAINER_NAME_EXPERIMENT_JOB)
Exemple #2
0
def stream_logs(experiment: 'Experiment') -> Iterable[str]:
    """Stream the logs of the experiment's master pod.

    The namespace and container name are read from ``conf``; the pod name is
    built for the master task at index 0. The result of
    ``base.stream_logs`` is returned unchanged.
    """
    name_fields = {
        'task_type': TaskType.MASTER,  # only the master task is targeted
        'task_idx': 0,
        'experiment_uuid': experiment.uuid.hex,
    }
    master_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    namespace = conf.get('K8S_NAMESPACE')
    manager = K8SManager(namespace=namespace, in_cluster=True)
    return base.stream_logs(k8s_manager=manager,
                            pod_id=master_pod,
                            container_job_name=conf.get('CONTAINER_NAME_EXPERIMENT_JOB'))
Exemple #3
0
def stream_logs(experiment: 'Experiment') -> Iterable[str]:
    """Stream the logs of the experiment's default-role pod.

    The pod name uses ``experiment.default_job_role`` with task index 0, and
    the container name is resolved from the experiment's backend and
    framework. The result of ``base.stream_logs`` is returned unchanged.
    """
    name_fields = {
        'task_type': experiment.default_job_role,
        'task_idx': 0,
        'experiment_uuid': experiment.uuid.hex,
    }
    target_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    namespace = conf.get('K8S_NAMESPACE')
    manager = K8SManager(namespace=namespace, in_cluster=True)
    container = get_experiment_job_container_name(
        backend=experiment.backend,
        framework=experiment.framework,
    )
    return base.stream_logs(
        k8s_manager=manager,
        pod_id=target_pod,
        container_job_name=container,
    )
Exemple #4
0
def process_logs(experiment, temp=True):
    """Collect the master pod's logs and hand them to ``safe_log_experiment``.

    The log lines come from ``base.process_logs`` for the master task at
    index 0 and are passed on with ``append=False``. ``temp`` is forwarded
    as given. Nothing is returned.
    """
    name_fields = {
        'task_type': TaskType.MASTER,  # only the master task is targeted
        'task_idx': 0,
        'experiment_uuid': experiment.uuid.hex,
    }
    master_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    manager = K8SManager(namespace=settings.K8S_NAMESPACE, in_cluster=True)
    collected = base.process_logs(k8s_manager=manager,
                                  pod_id=master_pod,
                                  container_job_name=settings.CONTAINER_NAME_EXPERIMENT_JOB)

    safe_log_experiment(
        experiment_name=experiment.unique_name,
        log_lines=collected,
        temp=temp,
        append=False,
    )
Exemple #5
0
def process_logs(experiment: 'Experiment', temp: bool = True) -> None:
    """Collect the default-role pod's logs and pass them to ``safe_log_experiment``.

    The pod name uses ``experiment.default_job_role`` with task index 0; the
    container name is resolved from the experiment's backend and framework.
    The lines returned by ``base.process_logs`` are passed on with
    ``append=False``, and ``temp`` is forwarded as given.
    """
    name_fields = {
        'task_type': experiment.default_job_role,
        'task_idx': 0,
        'experiment_uuid': experiment.uuid.hex,
    }
    target_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    namespace = conf.get('K8S_NAMESPACE')
    manager = K8SManager(namespace=namespace, in_cluster=True)
    container = get_experiment_job_container_name(
        backend=experiment.backend,
        framework=experiment.framework,
    )
    collected = base.process_logs(
        k8s_manager=manager,
        pod_id=target_pod,
        container_job_name=container,
    )

    safe_log_experiment(
        experiment_name=experiment.unique_name,
        log_lines=collected,
        temp=temp,
        append=False,
    )
Exemple #6
0
def process_logs(experiment_job, temp=True, k8s_manager=None):
    """Collect one experiment job's pod logs and pass them to ``safe_log_experiment_job``.

    The pod is identified by the job's ``role`` and ``sequence`` together
    with its experiment's uuid. When ``k8s_manager`` is not supplied (or is
    falsy), a new in-cluster ``K8SManager`` is created for the configured
    namespace. The lines returned by ``base.process_logs`` are passed on
    with ``append=False``, and ``temp`` is forwarded as given.
    """
    role = experiment_job.role
    sequence = experiment_job.sequence
    name_fields = {
        'task_type': role,
        'task_idx': sequence,
        'experiment_uuid': experiment_job.experiment.uuid.hex,
    }
    job_pod = EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
    # Reuse the caller's manager when one was provided.
    manager = k8s_manager if k8s_manager else K8SManager(
        namespace=settings.K8S_NAMESPACE, in_cluster=True)
    collected = base.process_logs(
        k8s_manager=manager,
        pod_id=job_pod,
        container_job_name=settings.CONTAINER_NAME_EXPERIMENT_JOB,
        task_type=role,
        task_idx=sequence,
    )

    safe_log_experiment_job(
        experiment_job_name=experiment_job.unique_name,
        log_lines=collected,
        temp=temp,
        append=False,
    )
Exemple #7
0
 def get_resource_name(self, task_type, task_idx):  # pylint:disable=arguments-differ
     """Return the resource name for the given task type and index.

     The name is produced by ``EXPERIMENT_JOB_NAME_FORMAT`` using this
     object's ``experiment_uuid``.
     """
     name_fields = {
         'task_type': task_type,
         'task_idx': task_idx,
         'experiment_uuid': self.experiment_uuid,
     }
     return EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
Exemple #8
0
 def pod_id(self) -> str:
     """Return the pod name built from this job's role, sequence and experiment uuid."""
     name_fields = {
         'task_type': self.role,
         'task_idx': self.sequence,
         'experiment_uuid': self.experiment.uuid.hex,
     }
     return EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)
Exemple #9
0
 def get_job_name(self, task_type, task_idx):
     """Return the job name for the given task type and index.

     The name is produced by ``EXPERIMENT_JOB_NAME_FORMAT`` using this
     object's ``experiment_uuid``.
     """
     name_fields = {
         'task_type': task_type,
         'task_idx': task_idx,
         'experiment_uuid': self.experiment_uuid,
     }
     return EXPERIMENT_JOB_NAME_FORMAT.format(**name_fields)