Code Example #1
    def list_job(self, pipeline_name=None, input_commit=None, output_commit=None, history=None):
        """
        Lists jobs. Yields `JobInfo` objects.

        Params:

        * pipeline_name: An optional string representing a pipeline name to
        filter on.
        * input_commit: An optional list of tuples, strings, or `Commit`
        objects representing input commits to filter on.
        * output_commit: An optional tuple, string, or `Commit` object
        representing an output commit to filter on.
        * history: An optional int indicating how many historical versions of
          pipelines to return jobs from. Semantics are:
            * 0: Return jobs from the current version of the pipeline or
              pipelines.
            * 1: Return the above, plus jobs from the next most recent version.
            * 2: etc.
            * -1: Return jobs from all historical versions.
        """

        pipeline = proto.Pipeline(name=pipeline_name) if pipeline_name is not None else None

        if isinstance(input_commit, list):
            input_commit = [commit_from(ic) for ic in input_commit]
        elif input_commit is not None:
            input_commit = [commit_from(input_commit)]

        output_commit = commit_from(output_commit) if output_commit is not None else None

        req = proto.ListJobRequest(pipeline=pipeline, input_commit=input_commit,
                                   output_commit=output_commit, history=history)

        return self.stub.ListJobStream(req, metadata=self.metadata)
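
A brief usage sketch for list_job, assuming a connected client instance; the variable name `client`, the pipeline name "edges", and the printed fields are illustrative, not from the original:

    # Iterate over the JobInfo stream, filtered to one pipeline and including
    # jobs from all historical pipeline versions. Field names follow the
    # Pachyderm 1.x pps protobufs; adjust to your generated classes.
    for job_info in client.list_job(pipeline_name="edges", history=-1):
        print(job_info.job.id, job_info.state)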
Code Example #2
 def rerun_pipeline(self, pipeline_name, exclude=tuple(), include=tuple()):
     req = proto.RerunPipelineRequest(
         pipeline=proto.Pipeline(name=pipeline_name),
         exclude=exclude,
         include=include
     )
     self.stub.RerunPipeline(req, metadata=self.metadata)
Code Example #3
    def get_pipeline_logs(self, pipeline_name, data_filters=None, master=None,
                          datum=None, follow=None, tail=None):
        """
        Gets logs for a pipeline. Yields `LogMessage` objects.

        Params:

        * pipeline_name: A string representing the pipeline to get
        logs from.
        * data_filters: An optional iterable of strings specifying the names
        of input files from which we want processing logs. This may contain
        multiple files, to query pipelines that contain multiple inputs. Each
        filter may be an absolute path of a file within a pps repo, or it may
        be a hash for that file (to search for files at specific versions).
        * master: An optional bool.
        * datum: An optional `Datum` object.
        * follow: An optional bool specifying whether logs should continue to
        stream forever.
        * tail: An optional int. If nonzero, the number of lines from the end
        of the logs to return.  Note: tail applies per container, so you will
        get tail * <number of pods> total lines back.
        """

        req = proto.GetLogsRequest(
            pipeline=proto.Pipeline(name=pipeline_name),
            data_filters=data_filters, master=master, datum=datum,
            follow=follow, tail=tail,
        )
        return self.stub.GetLogs(req, metadata=self.metadata)
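
A brief usage sketch for get_pipeline_logs, assuming a connected `client`; the pipeline name and the LogMessage field access are illustrative:

    # Fetch the last 10 log lines per container for the "edges" pipeline
    # without following the stream.
    for msg in client.get_pipeline_logs("edges", follow=False, tail=10):
        print(msg.message)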
Code Example #4
    def create_pipeline(self, pipeline_name, transform=None, parallelism_spec=None,
                        hashtree_spec=None, egress=None, update=None, output_branch=None,
                        scale_down_threshold=None, resource_requests=None,
                        resource_limits=None, input=None, description=None, cache_size=None,
                        enable_stats=None, reprocess=None, batch=None, max_queue_size=None,
                        service=None, chunk_spec=None, datum_timeout=None,
                        job_timeout=None, salt=None, standby=None, datum_tries=None,
                        scheduling_spec=None, pod_patch=None):
        """
        Creates a pipeline. For more info, please refer to the pipeline spec
        document:
        http://docs.pachyderm.io/en/latest/reference/pipeline_spec.html

        Params:
        * pipeline_name: A string representing the pipeline name.
        * transform: An optional `Transform` object.
        * parallelism_spec: An optional `ParallelismSpec` object.
        * hashtree_spec: An optional `HashtreeSpec` object.
        * egress: An optional `Egress` object.
        * update: An optional bool specifying whether this should behave as an
        upsert.
        * output_branch: An optional string representing the branch to output
        results on.
        * scale_down_threshold: An optional protobuf `Duration` object.
        * resource_requests: An optional `ResourceSpec` object.
        * resource_limits: An optional `ResourceSpec` object.
        * input: An optional `Input` object.
        * description: An optional string describing the pipeline.
        * cache_size: An optional string.
        * enable_stats: An optional bool.
        * reprocess: An optional bool. If true, Pachyderm forces the pipeline
        to reprocess all datums. It only has meaning if `update` is `True`.
        * batch: An optional bool.
        * max_queue_size: An optional int.
        * service: An optional `Service` object.
        * chunk_spec: An optional `ChunkSpec` object.
        * datum_timeout: An optional protobuf `Duration` object.
        * job_timeout: An optional protobuf `Duration` object.
        * salt: An optional string.
        * standby: An optional bool.
        * datum_tries: An optional int.
        * scheduling_spec: An optional `SchedulingSpec` object.
        * pod_patch: An optional string.
        """

        req = proto.CreatePipelineRequest(
            pipeline=proto.Pipeline(name=pipeline_name),
            transform=transform, parallelism_spec=parallelism_spec,
            hashtree_spec=hashtree_spec, egress=egress, update=update,
            output_branch=output_branch, scale_down_threshold=scale_down_threshold,
            resource_requests=resource_requests, resource_limits=resource_limits,
            input=input, description=description, cache_size=cache_size,
            enable_stats=enable_stats, reprocess=reprocess, batch=batch,
            max_queue_size=max_queue_size, service=service,
            chunk_spec=chunk_spec, datum_timeout=datum_timeout,
            job_timeout=job_timeout, salt=salt, standby=standby,
            datum_tries=datum_tries, scheduling_spec=scheduling_spec,
            pod_patch=pod_patch
        )
        self.stub.CreatePipeline(req, metadata=self.metadata)
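
A hedged usage sketch for create_pipeline. It assumes the generated protobuf message classes are importable as `proto`, as in the snippet, and that a connected `client` exists; the pipeline name, image, command, and input repo are illustrative:

    # Transform/Input/PFSInput field names follow the Pachyderm 1.x pps proto;
    # adjust them to match the proto version your client was generated from.
    transform = proto.Transform(cmd=["python3", "/edges.py"], image="pachyderm/opencv")
    client.create_pipeline(
        "edges",
        transform=transform,
        input=proto.Input(pfs=proto.PFSInput(repo="images", glob="/*")),
        description="Edge detection over the images repo",
    )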
Code Example #5
    def inspect_pipeline(self, pipeline_name, history=None):
        """
        Inspects a pipeline. Returns a `PipelineInfo` object.

        Params:

        * pipeline_name: A string representing the pipeline name.
        * history: An optional int indicating how many historical versions of
        the pipeline to consider. Semantics are:
            * 0: Return info for the current version of the pipeline.
            * 1: Return the above, plus the next most recent version.
            * 2: etc.
            * -1: Return info from all historical versions.
        """

        pipeline = proto.Pipeline(name=pipeline_name)

        if history is None:
            req = proto.InspectPipelineRequest(pipeline=pipeline)
            return self.stub.InspectPipeline(req, metadata=self.metadata)
        else:
            # `InspectPipeline` doesn't support history, but `ListPipeline`
            # with a pipeline filter does, so we use that here
            req = proto.ListPipelineRequest(pipeline=pipeline, history=history)
            pipelines = self.stub.ListPipeline(req, metadata=self.metadata).pipeline_info
            assert len(pipelines) <= 1
            return pipelines[0] if len(pipelines) else None
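
A brief usage sketch for inspect_pipeline, assuming a connected `client`; the pipeline name and printed fields are illustrative:

    # Without history, this is a direct InspectPipeline call.
    info = client.inspect_pipeline("edges")
    print(info.pipeline.name, info.state)

    # With history, the lookup goes through ListPipeline as in the code above
    # and may return None if no matching pipeline version is found.
    old_info = client.inspect_pipeline("edges", history=1)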
Code Example #6
 def create_pipeline(self,
                     pipeline_name,
                     transform=None,
                     parallelism_spec=None,
                     hashtree_spec=None,
                     egress=None,
                     update=None,
                     output_branch=None,
                     scale_down_threshold=None,
                     resource_requests=None,
                     resource_limits=None,
                     input=None,
                     description=None,
                     cache_size=None,
                     enable_stats=None,
                     reprocess=None,
                     batch=None,
                     max_queue_size=None,
                     service=None,
                     chunk_spec=None,
                     datum_timeout=None,
                     job_timeout=None,
                     salt=None,
                     standby=None,
                     datum_tries=None,
                     scheduling_spec=None,
                     pod_spec=None,
                     pod_patch=None):
     req = proto.CreatePipelineRequest(
         pipeline=proto.Pipeline(name=pipeline_name),
         transform=transform,
         parallelism_spec=parallelism_spec,
         hashtree_spec=hashtree_spec,
         egress=egress,
         update=update,
         output_branch=output_branch,
         scale_down_threshold=scale_down_threshold,
         resource_requests=resource_requests,
         resource_limits=resource_limits,
         input=input,
         description=description,
         cache_size=cache_size,
         enable_stats=enable_stats,
         reprocess=reprocess,
         batch=batch,
         max_queue_size=max_queue_size,
         service=service,
         chunk_spec=chunk_spec,
         datum_timeout=datum_timeout,
         job_timeout=job_timeout,
         salt=salt,
         standby=standby,
         datum_tries=datum_tries,
         scheduling_spec=scheduling_spec,
         pod_spec=pod_spec,
         pod_patch=pod_patch)
     self.stub.CreatePipeline(req, metadata=self.metadata)
Code Example #7
    def stop_pipeline(self, pipeline_name):
        """
        Stops a pipeline.

        Params:
        * pipeline_name: A string representing the pipeline name.
        """
        req = proto.StopPipelineRequest(pipeline=proto.Pipeline(name=pipeline_name))
        self.stub.StopPipeline(req, metadata=self.metadata)
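
A brief usage sketch for stop_pipeline, assuming a connected `client` that also exposes the start_pipeline method shown in Code Example #15; the pipeline name is illustrative:

    client.stop_pipeline("edges")   # pause processing for the pipeline
    client.start_pipeline("edges")  # resume it again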
Code Example #8
 def list_job(self, pipeline_name=None, input_commit=None, output_commit=None):
     if isinstance(input_commit, list):
         input_commit = [commit_from(ic) for ic in input_commit]
     elif isinstance(input_commit, six.string_types):
         input_commit = [commit_from(input_commit)]
     if output_commit:
         output_commit = commit_from(output_commit)
     req = proto.ListJobRequest(pipeline=proto.Pipeline(name=pipeline_name), input_commit=input_commit,
                                output_commit=output_commit)
     return self.stub.ListJob(req, metadata=self.metadata)
Code Example #9
    def delete_pipeline(self, pipeline_name, force=None):
        """
        Deletes a pipeline.

        Params:
        * pipeline_name: A string representing the pipeline name.
        * force: An optional bool specifying whether to force-delete the pipeline.
        """

        req = proto.DeletePipelineRequest(pipeline=proto.Pipeline(name=pipeline_name), force=force)
        self.stub.DeletePipeline(req, metadata=self.metadata)
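
A brief usage sketch for delete_pipeline, assuming a connected `client`; the pipeline name is illustrative:

    # Pass force=True to force the deletion, per the docstring above.
    client.delete_pipeline("edges", force=True)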
Code Example #10
    def get_logs(self, pipeline_name=None, job_id=None, data_filters=tuple(), master=False):
        pipeline = proto.Pipeline(name=pipeline_name) if pipeline_name else None
        job = proto.Job(id=job_id) if job_id else None

        if pipeline is None and job is None:
            raise ValueError("One of 'pipeline_name' or 'job_id' must be specified")

        req = proto.GetLogsRequest(
            pipeline=pipeline, job=job, data_filters=data_filters,
            master=master
        )
        return list(self.stub.GetLogs(req, metadata=self.metadata))
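
A brief usage sketch for get_logs; at least one of pipeline_name or job_id must be given, as enforced by the ValueError check above. The `client` variable, pipeline name, and job ID are illustrative:

    pipeline_logs = client.get_logs(pipeline_name="edges")
    job_logs = client.get_logs(job_id="0123456789abcdef0123456789abcdef")
    for msg in pipeline_logs:
        print(msg.message)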
Code Example #11
 def create_job(self, transform, pipeline_name, pipeline_version, parallelism_spec, inputs, egress, service, output_repo,
                output_branch, parent_job, resource_spec, input, new_branch, incremental, enable_stats, salt, batch):
     req = proto.CreateJobRequest(
         transform=transform, pipeline=proto.Pipeline(name=pipeline_name),
         pipeline_version=pipeline_version,
         parallelism_spec=parallelism_spec, inputs=inputs,
         egress=egress, service=service, output_repo=output_repo,
         output_branch=output_branch, parent_job=parent_job,
         resource_spec=resource_spec, input=input, new_branch=new_branch,
         incremental=incremental, enable_stats=enable_stats, salt=salt,
         batch=batch
     )
     return self.stub.CreateJob(req, metadata=self.metadata)
Code Example #12
    def run_pipeline(self, pipeline_name, provenance=None):
        """
        Runs a pipeline.

        Params:
        * pipeline_name: A string representing the pipeline name.
        * provenance: An optional iterable of `CommitProvenance` objects
        representing the pipeline execution provenance.
        """
        req = proto.RunPipelineRequest(
            pipeline=proto.Pipeline(name=pipeline_name),
            provenance=provenance,
        )
        self.stub.RunPipeline(req, metadata=self.metadata)
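
A brief usage sketch for run_pipeline, assuming a connected `client`; the pipeline name is illustrative:

    # Trigger a run of the pipeline; provenance is optional per the docstring.
    client.run_pipeline("edges")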
Code Example #13
    def flush_job(self, commits, pipeline_names=None):
        """
        Blocks until all of the jobs that have the specified commits as
        provenance have finished. Yields `JobInfo` objects.

        Params:
        * commits: A list of tuples, strings, or `Commit` objects representing
        the commits to flush.
        * pipeline_names: An optional list of strings specifying pipeline
        names. If specified, only jobs within these pipelines will be flushed.
        """

        commits = [commit_from(c) for c in commits]
        pipelines = [proto.Pipeline(name=name) for name in pipeline_names] if pipeline_names is not None else None
        req = proto.FlushJobRequest(commits=commits, to_pipelines=pipelines)
        return self.stub.FlushJob(req, metadata=self.metadata)
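
A brief usage sketch for flush_job, assuming a connected `client`; the commit is given in the tuple form the docstring allows, assumed here to be (repo name, commit or branch), and the names are illustrative:

    # Block until every job with the given commit in its provenance finishes,
    # restricted to the "edges" pipeline.
    for job_info in client.flush_job([("images", "master")], pipeline_names=["edges"]):
        print(job_info.job.id, job_info.state)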
Code Example #14
 def stop_pipeline(self, pipeline_name):
     req = proto.StopPipelineRequest(pipeline=proto.Pipeline(name=pipeline_name))
     self.stub.StopPipeline(req, metadata=self.metadata)
Code Example #15
 def start_pipeline(self, pipeline_name):
     req = proto.StartPipelineRequest(pipeline=proto.Pipeline(
         name=pipeline_name))
     self.stub.StartPipeline(req, metadata=self.metadata)
Code Example #16
 def delete_pipeline(self, pipeline_name, all=False):
     req = proto.DeletePipelineRequest(
         pipeline=proto.Pipeline(name=pipeline_name), all=all)
     self.stub.DeletePipeline(req, metadata=self.metadata)
Code Example #17
 def inspect_pipeline(self, pipeline_name):
     req = proto.InspectPipelineRequest(pipeline=proto.Pipeline(
         name=pipeline_name))
     return self.stub.InspectPipeline(req, metadata=self.metadata)