コード例 #1
0
	def test_samples_created_correctly_for_skipping_align_with_mocked_directory_structure(self, mock_os, mock_join, mock_parse_method):
		"""
		Tests the case where we want to skip alignment and the target suffix is given for the BAM files.
		In this case, we mock the return value from os.walk() and make the actual call to the find_files() method.

		The mock_* arguments are presumably injected by mock.patch decorators on this
		method (not visible in this excerpt).
		"""
		# list of tuples linking the sample names and conditions:
		pairings = [('A', 'X'),('B', 'X'),('C', 'Y')]
		mock_parse_method.return_value = pairings

		# the BAM path expected for each sample, in the same order as pairings
		# (find_files() itself is NOT mocked in this test, only os.walk() is):
		bamfiles = ['/path/to/project/dir/Sample_A/A.sort.primary.bam','/path/to/project/dir/Sample_B/B.sort.primary.bam','/path/to/project/dir/C.sort.primary.bam']

		# setup all the necessary parameters that the method will look at:
		p = PipelineBuilder('')
		p.all_samples = []
		mock_pipeline_params = Params()
		mock_pipeline_params.add(project_directory = '/path/to/project_dir')
		mock_pipeline_params.add(sample_annotation_file = '/path/to/project_dir/samples.txt')
		mock_pipeline_params.add(skip_align = True)
		mock_pipeline_params.add(target_bam = 'sort.primary.bam')
		p.builder_params = mock_pipeline_params

		# fake directory tree; it also contains A.sort.bam, which lacks the
		# 'sort.primary.bam' target suffix.
		# NOTE(review): the walk roots use '/path/to/project/dir' while project_directory
		# is '/path/to/project_dir' -- presumably harmless because os.walk is mocked; confirm.
		mock_os.walk.return_value = [('/path/to/project/dir', ['Sample_A', 'Sample_B'], ['C.sort.primary.bam']),
			('/path/to/project/dir/Sample_A', ['another_dir'], ['A.sort.primary.bam']),
			('/path/to/project/dir/Sample_B', [], ['B.sort.primary.bam']),
			('/path/to/project/dir/Sample_A/another_dir', [], ['A.sort.bam']),
			]

		p._PipelineBuilder__check_and_create_samples()

		# without this check the loop below would pass vacuously if no samples were created
		self.assertEqual(len(p.all_samples), len(pairings))
		for i,s in enumerate(p.all_samples):
			self.assertEqual(s.sample_name, pairings[i][0])
			self.assertIsNone(s.read_1_fastq)
			self.assertIsNone(s.read_2_fastq)
			self.assertEqual(s.bamfiles, [bamfiles[i]])
コード例 #2
0
	def test_samples_created_correctly_for_skipping_align(self, mock_find_files, mock_parse_method):
		"""
		Tests the case where we want to skip alignment and the target suffix is given for the BAM files.
		In this test, the call to the find_files method is mocked out with a dummy return value.

		The mock_* arguments are presumably injected by mock.patch decorators on this
		method (not visible in this excerpt).
		"""
		# list of tuples linking the sample names and conditions:
		pairings = [('A', 'X'),('B', 'X'),('C', 'Y')]
		mock_parse_method.return_value = pairings

		# successive return values of the mocked find_files(): one list of BAM paths per call
		bamfiles = [['A.sort.bam'],['B.sort.bam'],['C.sort.bam']]
		mock_find_files.side_effect = bamfiles

		# setup all the necessary parameters that the method will look at:
		p = PipelineBuilder('')
		p.all_samples = []
		mock_pipeline_params = Params()
		mock_pipeline_params.add(project_directory = '/path/to/project_dir')
		mock_pipeline_params.add(sample_annotation_file = '/path/to/project_dir/samples.txt')
		mock_pipeline_params.add(skip_align = True)
		mock_pipeline_params.add(target_bam = 'sort.bam')
		p.builder_params = mock_pipeline_params

		p._PipelineBuilder__check_and_create_samples()

		# without this check the loop below would pass vacuously if no samples were created
		self.assertEqual(len(p.all_samples), len(pairings))
		for i,s in enumerate(p.all_samples):
			self.assertEqual(s.sample_name, pairings[i][0])
			self.assertIsNone(s.read_1_fastq)
			self.assertIsNone(s.read_2_fastq)
			self.assertEqual(s.bamfiles, bamfiles[i])
コード例 #3
0
	def test_exception_raised_if_missing_second_fastq_in_paired_alignment(self, mock_os, mock_glob, mock_join, mock_parse_method):
		"""
		Paired-end alignment is requested, but one of the glob lookups yields no
		read 2 fastq file; creating the samples must raise MissingFileException.
		"""
		# (sample name, condition) tuples returned by the mocked parse method:
		sample_conditions = [('A', 'X'),('B', 'X'),('C', 'Y')]
		mock_parse_method.return_value = sample_conditions

		builder = PipelineBuilder('')
		builder.all_samples = []

		# parameters the method under test will look at, added one at a time in this order:
		settings = [
			('project_directory', '/path/to/project_dir'),
			('read_1_fastq_tag', '_R1_001.fastq.gz'),
			('read_2_fastq_tag', '_R2_001.fastq.gz'),
			('sample_annotation_file', '/path/to/project_dir/samples.txt'),
			('skip_align', False),
			('paired_alignment', True),
			('target_bam', 'sort.bam'),
			('sample_dir_prefix', 'Sample_'),
		]
		params = Params()
		for key, value in settings:
			params.add(**{key: value})
		builder.builder_params = params

		# successive glob.glob() results; the fourth one is empty, i.e. no R2 fastq
		# is found for one of the samples:
		glob_results = [
			['A_R1_001.fastq.gz'],
			['A_R2_001.fastq.gz'],
			['B_R1_001.fastq.gz'],
			[],
			['C_R1_001.fastq.gz'],
			['C_R2_001.fastq.gz'],
		]
		mock_glob.glob.side_effect = glob_results

		# every os.path.isdir() check reports True (presumably so the sample
		# directories appear to exist -- confirm against the method under test):
		mock_os.path.isdir.return_value = True

		with self.assertRaises(MissingFileException):
			builder._PipelineBuilder__check_and_create_samples()
コード例 #4
0
    def test_raises_exception_if_skipping_align_and_pairing_not_specified(
            self, mock_find_files, mock_parse_method):
        """
        Alignment is skipped and no pairing information is supplied (no
        paired/unpaired entry is added to the parameters); creating the
        samples must raise ParameterNotFoundException.
        """
        # (sample name, condition) tuples returned by the mocked parse method:
        sample_conditions = [('A', 'X'), ('B', 'X'), ('C', 'Y')]
        mock_parse_method.return_value = sample_conditions

        # successive return values of the mocked find_files(): one list per call
        bam_lookups = [['A.sort.bam'], ['B.sort.bam'], ['C.sort.bam']]
        mock_find_files.side_effect = bam_lookups

        builder = PipelineBuilder('')
        builder.all_samples = []

        # parameters the method under test will look at, added one at a time
        # in this order:
        settings = [
            ('project_directory', '/path/to/project_dir'),
            ('sample_annotation_file', '/path/to/project_dir/samples.txt'),
            ('skip_align', True),
            ('target_bam', 'sort.bam'),
        ]
        params = Params()
        for key, value in settings:
            params.add(**{key: value})
        builder.builder_params = params

        with self.assertRaises(ParameterNotFoundException):
            builder._PipelineBuilder__check_and_create_samples()
コード例 #5
0
    def test_exception_raised_if_multiple_fastq_found(self, mock_os, mock_glob,
                                                      mock_join,
                                                      mock_parse_method):
        """
        Checks that MultipleFileFoundException is raised when a glob lookup
        matches more than one fastq file: first with two R1 matches for one
        sample, then with two R2 matches for one sample.
        """
        # (sample name, condition) tuples returned by the mocked parse method:
        sample_conditions = [('A', 'X'), ('B', 'X'), ('C', 'Y')]
        mock_parse_method.return_value = sample_conditions

        builder = PipelineBuilder('')
        builder.all_samples = []

        # parameters the method under test will look at, added one at a time
        # in this order.
        # NOTE(review): 'paired_alignment' is never set here, although the
        # second scenario is described as wanting paired alignment -- confirm.
        settings = [
            ('project_directory', '/path/to/project_dir'),
            ('read_1_fastq_tag', '_R1_001.fastq.gz'),
            ('read_2_fastq_tag', '_R2_001.fastq.gz'),
            ('read_1_fastqc_tag', '_R1_001_fastqc'),
            ('read_2_fastqc_tag', '_R2_001_fastqc'),
            ('fastqc_report_file', 'fastqc_report.html'),
            ('sample_annotation_file', '/path/to/project_dir/samples.txt'),
            ('skip_align', False),
            ('target_bam', 'sort.bam'),
            ('sample_dir_prefix', 'Sample_'),
        ]
        params = Params()
        for key, value in settings:
            params.add(**{key: value})
        builder.builder_params = params

        # every os.path.isdir() check reports True:
        mock_os.path.isdir.return_value = True

        # scenario 1: only R1 fastq files exist, and one lookup returns two of them
        duplicate_r1 = [
            ['A_R1_001.fastq.gz'], [], [], [],
            ['B_R1_001.fastq.gz', 'B_AT_R1_001.fastq.gz'], [], [], [],
            ['C_R1_001.fastq.gz'], [], [], [],
        ]
        # scenario 2: both R1 and R2 fastq files exist, and one R2 lookup returns two
        duplicate_r2 = [
            ['A_R1_001.fastq.gz'], ['A_R2_001.fastq.gz'], [], [],
            ['B_R1_001.fastq.gz'], ['B_R2_001.fastq.gz'], [], [],
            ['C_R1_001.fastq.gz'],
            ['C_R2_001.fastq.gz', 'C_AT_R2_001.fastq.gz'], [], [],
        ]

        # the same builder instance is reused for both scenarios
        for glob_results in (duplicate_r1, duplicate_r2):
            mock_glob.glob.side_effect = glob_results
            with self.assertRaises(MultipleFileFoundException):
                builder._PipelineBuilder__check_and_create_samples()
コード例 #6
0
    def test_samples_created_correctly_for_paired_end_protocol(
            self, mock_os, mock_glob, mock_join, mock_parse_method):
        """
        Tests that, given alignment is desired and the correct project
        structure is in place, the correct samples are added to the pipeline
        (paired-end reads).

        The mock_* arguments are presumably injected by mock.patch decorators
        on this method (not visible in this excerpt).
        """
        # list of tuples linking the sample names and conditions:
        pairings = [('A', 'X'), ('B', 'X'), ('C', 'Y')]
        mock_parse_method.return_value = pairings

        # setup all the necessary parameters that the method will look at:
        p = PipelineBuilder('')
        p.all_samples = []
        mock_pipeline_params = Params()
        mock_pipeline_params.add(project_directory='/path/to/project_dir')
        mock_pipeline_params.add(read_1_fastq_tag='_R1_001.fastq.gz')
        mock_pipeline_params.add(read_2_fastq_tag='_R2_001.fastq.gz')
        mock_pipeline_params.add(read_1_fastqc_tag='_R1_001_fastqc')
        mock_pipeline_params.add(read_2_fastqc_tag='_R2_001_fastqc')
        mock_pipeline_params.add(fastqc_report_file='fastqc_report.html')
        mock_pipeline_params.add(
            sample_annotation_file='/path/to/project_dir/samples.txt')
        mock_pipeline_params.add(skip_align=False)
        mock_pipeline_params.add(paired_alignment=True)
        mock_pipeline_params.add(target_bam='sort.bam')
        mock_pipeline_params.add(sample_dir_prefix='Sample_')
        p.builder_params = mock_pipeline_params

        # mock unique R1 and R2 fastq files. The fixture holds four consecutive
        # glob results per sample: R1, R2, then two empty lists (presumably the
        # fastqc lookups -- confirm against the method under test).
        glob_return = [['A_R1_001.fastq.gz'], ['A_R2_001.fastq.gz'], [], [],
                       ['B_R1_001.fastq.gz'], ['B_R2_001.fastq.gz'], [], [],
                       ['C_R1_001.fastq.gz'], ['C_R2_001.fastq.gz'], [], []]
        mock_glob.glob.side_effect = glob_return

        # every os.path.isdir() check reports True:
        mock_os.path.isdir.return_value = True

        p._PipelineBuilder__check_and_create_samples()

        # without this check the loop below would pass vacuously if no samples
        # were created
        self.assertEqual(len(p.all_samples), len(pairings))
        for i, s in enumerate(p.all_samples):
            self.assertEqual(s.sample_name, pairings[i][0])
            # stride of 4 matches the per-sample layout of glob_return above
            self.assertEqual(s.read_1_fastq, glob_return[i * 4][0])
            self.assertEqual(s.read_2_fastq, glob_return[i * 4 + 1][0])
            self.assertEqual(s.bamfiles, [])