Примеры Pipeline на Python: примеры использования kale.Pipeline

Пример #1

0

Показать файл

    def __init__(self,
                 nb_path: str,
                 nb_metadata_overrides: Dict[str, Any] = None,
                 skip_validation: bool = False):
        """Build a NotebookProcessor from a notebook on disk.

        The notebook is read, its Kale metadata section is extended with the
        notebook path and any caller-supplied overrides, and a Pipeline is
        created from the resulting configuration.

        Args:
            nb_path: Path to the source notebook. The user-expanded form is
                stored in `self.nb_path`.
            nb_metadata_overrides: Optional settings applied on top of the
                ones stored in the notebook metadata.
            skip_validation: When True no NotebookConfig is built (so the
                notebook's metadata is not validated) and the Pipeline
                receives `None` as its config. Useful when only a part of
                the notebook is parsed (e.g., to retrieve pipeline metrics)
                and the config for pipeline generation might still be
                invalid.
        """
        self.nb_path = os.path.expanduser(nb_path)
        self.notebook = self._read_notebook()

        kale_metadata = self.notebook.metadata.get(KALE_NB_METADATA_KEY, {})

        # fixme: needed? Note that the path is stored exactly as received,
        #  not in its expanded form.
        kale_metadata.update({"notebook_path": nb_path})
        if nb_metadata_overrides:
            kale_metadata.update(nb_metadata_overrides)

        # Building the config validates the metadata and populates defaults.
        # FIXME: Maybe improve this by implementing a "skip_validation" flag
        #  in the config class
        self.config = (None if skip_validation
                       else NotebookConfig(**kale_metadata))
        self.pipeline = Pipeline(self.config)

Пример #2

0

Показать файл

Файл: test_config.py Проект: ydataai/kale

def test_get_volumes_parameters_exc(dummy_nb_config, volumes):
    """Check that invalid volumes are rejected with a ValueError.

    Building the pipeline from the config and setting the volume pipeline
    parameters is expected to raise a ValueError whose message matches the
    VolumeTypeValidator error.
    """
    expected_error = "VolumeTypeValidator: Value unknown is not allowed"
    with pytest.raises(ValueError, match=expected_error):
        config = NotebookConfig(**dummy_nb_config, volumes=volumes)
        Pipeline(config).set_volume_pipeline_parameters()

Пример #3

0

Показать файл

Файл: baseprocessor.py Проект: srinivasav22/kale

 def __init__(self,
              config: PipelineConfig = None,
              skip_validation: bool = False,
              **kwargs):
     """Set up the processor's config and create its Pipeline.

     Args:
         config: Ready-made configuration. When truthy it is used as is.
         skip_validation: When True, no configuration is built from
             `kwargs` even if `config` is missing.
         **kwargs: Passed to `self.config_cls` to build the configuration
             when `config` is missing and `skip_validation` is False.
     """
     build_config = not (config or skip_validation)
     self.config = config
     if build_config:
         self.config = self.config_cls(**kwargs)
     # The Pipeline may receive a falsy config (e.g. None) when validation
     # is skipped.
     self.pipeline = Pipeline(self.config)

Пример #4

0

Показать файл

Файл: dependencies.py Проект: zhilongli/kale

def assign_metrics(pipeline: Pipeline, pipeline_metrics: dict):
    """Assign pipeline metrics to specific pipeline steps.

    This assignment follows a similar logic to the detection of `out`
    dependencies. Starting from a temporary step - child of all the leaf nodes,
    all the nodes in the pipelines are traversed in reversed topological order.
    When a step shows one of the metrics as part of its code, then that metric
    is assigned to the step: the code producing the metrics artifact is
    appended to the step's source and the step's `metrics` flag is set.

    The temporary step is always removed before returning, even when the
    traversal raises.

    Args:
        pipeline: Pipeline object. It is modified in place.
        pipeline_metrics (dict): a dict of pipeline metrics where the key is
            the KFP sanitized name and the value the name of the original
            variable.
    """
    # create a temporary step at the end of the pipeline to simplify the
    # iteration from the leaf steps
    tmp_step_name = "_tmp"
    leaf_steps = pipeline.get_leaf_steps()
    if not leaf_steps:
        return
    for step in leaf_steps:
        pipeline.add_edge(step.name, tmp_step_name)

    try:
        # pipeline_metrics is a dict having sanitized variable names as keys
        # and the corresponding variable names as values. Here we need to
        # refer to the sanitized names using the python variables.
        # XXX: We could change parse_metrics_print_statements() to return the
        # XXX: reverse dictionary, but that would require changing either
        # XXX: rpc.nb.get_pipeline_metrics() or change in the JupyterLab
        # XXX: Extension parsing of the RPC result
        rev_pipeline_metrics = {v: k for k, v in pipeline_metrics.items()}
        metrics_left = set(rev_pipeline_metrics)
        for anc in graphutils.get_ordered_ancestors(pipeline, tmp_step_name):
            if not metrics_left:
                break

            anc_step = pipeline.get_step(anc)
            anc_source = '\n'.join(anc_step.source)
            # get all the marshal candidates from father's source and
            # intersect with the metrics that have not been matched yet
            marshal_candidates = kale_ast.get_marshal_candidates(anc_source)
            assigned_metrics = metrics_left.intersection(marshal_candidates)
            if not assigned_metrics:
                # Nothing to emit for this step: leave its source and its
                # `metrics` flag untouched.
                continue

            # Remove the metrics that have already been assigned.
            metrics_left.difference_update(assigned_metrics)
            # Generate code to produce the metrics artifact in the current
            # step. Sorting keeps the generated code deterministic.
            code = METRICS_TEMPLATE % ("    " + ",\n    ".join(
                '"%s": %s' % (rev_pipeline_metrics[x], x)
                for x in sorted(assigned_metrics)
            ))
            anc_step.source.append(code)
            # need to have a `metrics` flag set to true in order to set the
            # metrics output artifact in the pipeline template. Only steps
            # that actually received the metrics code are flagged.
            anc_step.metrics = True
    finally:
        # Never leave the helper node behind, even if the traversal failed.
        pipeline.remove_node(tmp_step_name)

Пример #5

0

Показать файл

def test_generate_function(_nb_config_mock, notebook_processor, step_name,
                           source, ins, outs, metadata, target):
    """Test that python code is generated correctly.

    A single step is compiled into a lightweight component and the result is
    compared, ignoring leading/trailing whitespace, with the content of the
    `target` file found under `../assets/functions` relative to THIS_DIR.
    """
    pipeline = Pipeline(NotebookConfig(**{**DUMMY_NB_CONFIG, **metadata}))
    pipeline.processor = notebook_processor
    step = Step(name=step_name, source=source, ins=ins, outs=outs)
    compiler = Compiler(pipeline)
    res = compiler.generate_lightweight_component(step)
    target_path = os.path.join(THIS_DIR, "../assets/functions", target)
    # Use a context manager so the asset file is closed deterministically,
    # and keep `target` (the file name) distinct from the file content.
    with open(target_path) as target_file:
        expected = target_file.read()
    assert res.strip() == expected.strip()

Пример #6

0

Показать файл

def test_set_volume_pipeline_parameters(notebook_processor, dummy_nb_config,
                                        volumes, target):
    """Check the pipeline parameters produced from the notebook volumes.

    The processor gets a fresh Pipeline built from the dummy config plus
    `volumes`; after setting the volume pipeline parameters, the pipeline's
    `pipeline_parameters` must equal `target`.
    """
    config = NotebookConfig(**dummy_nb_config, volumes=volumes)
    notebook_processor.pipeline = Pipeline(config)
    notebook_processor._set_volume_pipeline_parameters()
    resulting_parameters = notebook_processor.pipeline.pipeline_parameters
    assert target == resulting_parameters

Пример #7

0

Показать файл

Файл: test_parser.py Проект: gbrlins/kale-1

def test_merge_code(dummy_nb_config):
    """Check that merging code into a step appends it to the step source."""
    config = NotebookConfig(**dummy_nb_config)
    pipeline = Pipeline(config)
    initial_step = Step(name="test", source=["test1"])
    pipeline.add_step(initial_step)

    pipeline.get_step("test").merge_code("test2")

    merged_source = pipeline.get_step("test").source
    assert merged_source == ["test1", "test2"]

Пример #8

0

Показать файл