def test_pipeline_read_all_multiple_files_large(self):
  pipeline = TestPipeline()
  pcoll = (pipeline
           | 'Create' >> beam.Create(
               [testdata_util.get_full_file_path('valid-4.0.vcf'),
                testdata_util.get_full_file_path('valid-4.1-large.vcf'),
                testdata_util.get_full_file_path('valid-4.2.vcf')])
           | 'Read' >> ReadAllFromVcf())
  assert_that(pcoll, asserts.count_equals_to(9900))
  pipeline.run()
def test_pipeline_read_all_multiple_files(self):
  with TempDir() as tempdir:
    file_name_1 = self._create_temp_vcf_file(
        _SAMPLE_HEADER_LINES + _SAMPLE_TEXT_LINES, tempdir)
    file_name_2 = self._create_temp_vcf_file(
        _SAMPLE_HEADER_LINES + _SAMPLE_TEXT_LINES, tempdir)
    pipeline = TestPipeline()
    pcoll = (pipeline
             | 'Create' >> beam.Create([file_name_1, file_name_2])
             | 'Read' >> ReadAllFromVcf())
    assert_that(pcoll, asserts.count_equals_to(2 * len(_SAMPLE_TEXT_LINES)))
    pipeline.run()
def _assert_pipeline_read_files_record_count_equal(
    self, input_pattern, expected_count, use_read_all=False):
  """Helper method for verifying the total number of records read.

  Args:
    input_pattern (str): Input file pattern to read.
    expected_count (int): Expected number of records that were read.
    use_read_all (bool): Whether to use the scalable ReadAllFromVcf transform
      instead of ReadFromVcf.
  """
  pipeline = TestPipeline()
  if use_read_all:
    pcoll = (pipeline
             | 'Create' >> beam.Create([input_pattern])
             | 'Read' >> ReadAllFromVcf())
  else:
    pcoll = pipeline | 'Read' >> ReadFromVcf(input_pattern)
  assert_that(pcoll, asserts.count_equals_to(expected_count))
  pipeline.run()
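# A minimal sketch (not part of the original suite) showing how the helper
# above could be exercised for both code paths. It reuses only names already
# present in this file (_SAMPLE_HEADER_LINES, _SAMPLE_TEXT_LINES, TempDir,
# _create_temp_vcf_file); no new fixtures or record counts are assumed.
def test_read_single_file_record_count_both_paths(self):
  with TempDir() as tempdir:
    file_name = self._create_temp_vcf_file(
        _SAMPLE_HEADER_LINES + _SAMPLE_TEXT_LINES, tempdir)
    # ReadFromVcf path.
    self._assert_pipeline_read_files_record_count_equal(
        file_name, len(_SAMPLE_TEXT_LINES))
    # Scalable ReadAllFromVcf path.
    self._assert_pipeline_read_files_record_count_equal(
        file_name, len(_SAMPLE_TEXT_LINES), use_read_all=True)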