def begin_pipeline(**kwargs):
    print("begin_pipeline:")
    s3_bucket = os.environ.get("S3_BUCKET", "")
    folder_path = kwargs['dag_run'].conf.get('folder_path')
    s3_file = kwargs['dag_run'].conf.get('s3_file')
    uuid_mapping_file = kwargs['dag_run'].conf.get('uuid_mapping_file')
    biobank_file = kwargs['dag_run'].conf.get('biobank_file')
    mapping_file = kwargs['dag_run'].conf.get('mapping_file')

    dp = DagPebbles()
    download_key = dp.get_download_key(s3_bucket, folder_path, s3_file)
    pipeline_state_args = {
        "s3_bucket": s3_bucket,
        "folder_path": folder_path,
        "s3_file": s3_file,
        "uuid_mapping_file": uuid_mapping_file,
        "biobank_file": biobank_file,
        "mapping_file": mapping_file,
        "download_key": download_key
    }
    dp.save_pipeline_state(**pipeline_state_args)

    kwargs["ti"].xcom_push(key="folder_path", value=folder_path)
    kwargs["ti"].xcom_push(key="s3_file", value=s3_file)
    kwargs["ti"].xcom_push(key="download_key", value=download_key)
    kwargs["ti"].xcom_push(key="uuid_mapping_file", value=uuid_mapping_file)
    kwargs["ti"].xcom_push(key="biobank_file", value=biobank_file)
    kwargs["ti"].xcom_push(key="mapping_file", value=mapping_file)
Ejemplo n.º 2
0
def stage_custom_dmp_files(**kwargs):
    print("stage_custom_dmp_files:")
    dp = DagPebbles()
    custom_log_file = kwargs['dag_run'].conf.get('custom_log_file')
    custom_dmp_file = kwargs['dag_run'].conf.get('custom_dmp_file')
    pipeline_args = {
        "custom_log_file": custom_log_file,
        "custom_dmp_file": custom_dmp_file
    }
    dp.save_pipeline_state(**pipeline_args)
    dp.stage_custom_dmp_files(**pipeline_args)