示例#1
0
def test_run_step_five():
    """Execute the step-five pipeline and check the ranks it logs.

    The parse solid receives the path returned by
    ``script_relative_path('pagerank_data.txt')`` as its ``pagerank_data``
    input, and the rank-calculation solid is configured with
    ``iterations`` set to 3.
    """
    pipeline = define_repository().get_pipeline('pyspark_pagerank_step_five')
    data_path = script_relative_path('pagerank_data.txt')
    solids_config = {
        'parse_pagerank_data_step_five': {
            'inputs': {'pagerank_data': data_path},
        },
        'calculate_ranks_step_five': {
            'config': {'iterations': 3},
        },
    }

    result = execute_pipeline(
        pipeline,
        environment_dict={'solids': solids_config},
    )
    assert result.success

    # Compared as sets, so the order of the (site, rank) pairs is irrelevant.
    logged_ranks = set(
        result.result_for_solid('log_ranks_step_five').output_value()
    )
    expected_ranks = {
        ('alessimportantsite.com', 0.5055833333333333),
        ('whatdoesitallmeananyways.com', 0.5055833333333333),
        ('importantsite.com', 2.4832499999999995),
        ('anotherlessimportantsite.com', 0.5055833333333333),
    }
    assert logged_ranks == expected_ranks
def test_run_step_four():
    """Execute the step-four pipeline and check the ranks it produces.

    The parse solid receives the path returned by
    ``script_relative_path('pagerank_data.txt')`` as its ``pagerank_data``
    input; no other solid configuration is supplied.
    """
    result = execute_pipeline(
        define_repository().get_pipeline('pyspark_pagerank_step_four'),
        environment_dict={
            'solids': {
                'parse_pagerank_data_step_four': {
                    'inputs': {'pagerank_data': script_relative_path('pagerank_data.txt')}
                }
            }
        },
    )
    assert result.success

    # Read the value with output_value(), matching test_run_step_five, rather
    # than the older transformed_value() accessor.
    # Compared as sets, so the order of the (site, rank) pairs is irrelevant.
    assert set(result.result_for_solid('rest_of_pipeline').output_value()) == {
        ('anotherlessimportantsite.com', 0.9149999999999999),
        ('whatdoesitallmeananyways.com', 0.9149999999999999),
        ('importantsite.com', 1.255),
        ('alessimportantsite.com', 0.9149999999999999),
    }
示例#3
0
def test_pyspark_pagerank_repo():
    """Check that the repository returns a truthy result for its pipelines."""
    all_pipelines = define_repository().get_all_pipelines()
    assert all_pipelines
示例#4
0
def test_run_step_one():
    """Execute the step-one pipeline without extra config and expect success."""
    pipeline = define_repository().get_pipeline('pyspark_pagerank_step_one')
    result = execute_pipeline(pipeline)
    assert result.success