Example #1
0
 def test_Butterfly_is_identified_correctly(self):
     """A java process launching Butterfly.jar is filed under 'Butterfly'.

     Feeds one sample line to ``build_datasets`` and expects that same
     line, unchanged, as the only entry under the 'Butterfly' key of the
     second returned value.
     """
     lines = [
         "20140920 17:28:14 30084 befulton 20 62435 0 S 24215176 0 37768 24080384 92 4 14420 30 0.03 0.17 "
         "4 00:00.20 0 6 519 0 203 1 0 0 1056 java -Xmx20G -Xms1G -jar /trinity/Butterfly/Butterfly.jar "
         "-N 100000 -L 200 -F 500 -C /jobdir/trinity_out/chrysalis/Component_bins/Cbin5/c6058.graph "
         "--max_number_of_paths_per_node=10 --path_reinforcement_distance=75 --triplet-lock",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # assertEqual, not the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(lines, line_dict['Butterfly'])
Example #2
0
 def test_build_datasets_adds_inchworm_to_line_dict(self):
     """A line whose command is a full path to inchworm is filed under 'inchworm'.

     The sample command is ``/N/test/Inchworm/bin/inchworm``; the test
     expects the whole input line to appear, unchanged, under the
     'inchworm' key of the second value returned by ``build_datasets``.
     """
     lines = [
         "20140919 11:08:49 44009 user 20 44008 0 R 10975748 0 10837764 10957692 92 128 3416 9 0.00 4.99 99 "
         "01:33:35 0 0 0 0 0 0 0 0 1 /N/test/Inchworm/bin/inchworm --kmers jellyfish.kmers.fa --run_inchworm "
         "-K 25 -L 25 --monitor 1",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # assertEqual, not the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(lines, line_dict['inchworm'])
Example #3
0
 def test_Butterfly_is_identified_correctly(self):
     """Check that a ``java -jar .../Butterfly.jar`` line lands under 'Butterfly'.

     ``build_datasets`` is given a single sample line; the second value it
     returns must map 'Butterfly' to a list holding exactly that line.
     """
     lines = [
         "20140920 17:28:14 30084 befulton 20 62435 0 S 24215176 0 37768 24080384 92 4 14420 30 0.03 0.17 "
         "4 00:00.20 0 6 519 0 203 1 0 0 1056 java -Xmx20G -Xms1G -jar /trinity/Butterfly/Butterfly.jar "
         "-N 100000 -L 200 -F 500 -C /jobdir/trinity_out/chrysalis/Component_bins/Cbin5/c6058.graph "
         "--max_number_of_paths_per_node=10 --path_reinforcement_distance=75 --triplet-lock"
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(lines, line_dict['Butterfly'])
Example #4
0
 def test_Chrysalis_is_identified_correctly(self):
     """A Chrysalis command line is filed under 'Chrysalis'.

     The sample line also mentions ``Butterfly.jar`` as the value of its
     ``-butterfly`` argument; the test expects the line to be present,
     unchanged, under the 'Chrysalis' key.
     """
     lines = [
         "20140920 11:29:54 49383 befulton 20 43684 0 S 18468 0 1464 300 92 236 3416 8 0.00 0.00 0 00:02.44 "
         "0 0 0 0 0 0 0 0 0 /trinity/Chrysalis/Chrysalis "
         "-i both.fa -iworm /jobdir/trinity_out/inchworm.K25.L25.fa.clipped.fa -o "
         "/jobdir/trinity_out/chrysalis -cpu 16 -min_glue 2 "
         "-min_iso_ratio 0.05 -glue_factor 0.05 -weldmer_size 48 -min 200 -dist 500 -max_reads 200000 "
         "-sort_buffer_size 20G -max_mem_reads 1000000 -strand 1 -paired -reads_for_pairs both.fa "
         "-butterfly /trinity/Butterfly/Butterfly.jar",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # assertEqual, not the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(lines, line_dict['Chrysalis'])
Example #5
0
 def test_build_datasets_adds_bowtie_build_to_line_dict_if_no_path(self):
     """A bare ``bowtie-build`` command (no directory prefix) is filed under 'bowtie-build'.

     The first two sample lines run ``bowtie-build`` directly. The third
     runs ``some_app`` and only contains 'bowtie-build' inside an argument
     path, so it is expected to be absent from the 'bowtie-build' entry.
     """
     lines = [
         "20140919 11:11:24 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 "
         "02:27.86 0 960 0 960 0 124 0 0 0 bowtie-build /N/test/trinity_out/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa",
         "20140919 11:11:29 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 02:27.86"
         " 0 960 0 960 0 124 0 0 0 bowtie-build /N/trinity_out/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa",
         "20140919 11:11:34 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 02:27.86"
         " 0 960 0 960 0 124 0 0 0 some_app /N/trinity_out/bowtie-build/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # Only the two genuine bowtie-build invocations are expected.
     # assertEqual replaces the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(lines[0:2], line_dict['bowtie-build'])
Example #6
0
 def test_Chrysalis_is_identified_correctly(self):
     """Check that a ``/trinity/Chrysalis/Chrysalis`` line lands under 'Chrysalis'.

     The line's final argument names ``Butterfly.jar``; the assertion
     requires the unchanged input line to be the 'Chrysalis' entry of the
     second value returned by ``build_datasets``.
     """
     lines = [
         "20140920 11:29:54 49383 befulton 20 43684 0 S 18468 0 1464 300 92 236 3416 8 0.00 0.00 0 00:02.44 "
         "0 0 0 0 0 0 0 0 0 /trinity/Chrysalis/Chrysalis "
         "-i both.fa -iworm /jobdir/trinity_out/inchworm.K25.L25.fa.clipped.fa -o "
         "/jobdir/trinity_out/chrysalis -cpu 16 -min_glue 2 "
         "-min_iso_ratio 0.05 -glue_factor 0.05 -weldmer_size 48 -min 200 -dist 500 -max_reads 200000 "
         "-sort_buffer_size 20G -max_mem_reads 1000000 -strand 1 -paired -reads_for_pairs both.fa "
         "-butterfly /trinity/Butterfly/Butterfly.jar"
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(lines, line_dict['Chrysalis'])
Example #7
0
 def test_build_datasets_adds_bowtie_build_to_line_dict_if_no_path(self):
     """Lines invoking ``bowtie-build`` without a path prefix go under 'bowtie-build'.

     Three lines are supplied: two whose command is ``bowtie-build`` and
     one whose command is ``some_app`` with 'bowtie-build' appearing only
     as a directory name in an argument. Only the first two are expected
     in the 'bowtie-build' entry.
     """
     lines = [
         "20140919 11:11:24 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 "
         "02:27.86 0 960 0 960 0 124 0 0 0 bowtie-build /N/test/trinity_out/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa",
         "20140919 11:11:29 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 02:27.86"
         " 0 960 0 960 0 124 0 0 0 bowtie-build /N/trinity_out/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa",
         "20140919 11:11:34 44143 user 20 44131 0 R 547552 0 502040 535608 164 260 3244 9 0.01 4.98 99 02:27.86"
         " 0 960 0 960 0 124 0 0 0 some_app /N/trinity_out/bowtie-build/jaccard_clip_workdir/iworm.fa "
         "/N/trinity_out/jaccard_clip_workdir/iworm.fa"
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # The some_app line must be excluded, hence the slice.
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(lines[0:2], line_dict['bowtie-build'])
Example #8
0
 def test_shell_c_commands_are_dropped(self):
     """A ``sh -c ...`` wrapper line produces no entry in the line dict.

     The only input line is a shell invocation wrapping a fastool
     command; the second value returned by ``build_datasets`` is expected
     to be empty.
     """
     # Adjacent string literals inside the brackets concatenate implicitly,
     # so no backslash continuations are needed.
     lines = [
         "20140919 10:06:14 43812 befulton 20 43684 0 S 108160 0 1228 196 92 848 1832 1 0.00 0.00 0 00:00.00 "
         "0 0 0 0 0 0 0 0 0 sh -c /trinity/trinity-plugins/fastool/fastool --rev  --illumina-trinity "
         "--to-fasta /jobdir/reads.left.fq >> left.fa",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # assertEqual, not the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(0, len(line_dict))
Example #9
0
 def test_build_datasets_adds_inchworm_to_line_dict(self):
     """Check that an inchworm invocation is stored under the 'inchworm' key.

     The command in the sample line is given with a directory prefix
     (``/N/test/Inchworm/bin/inchworm``); the full, unchanged line must be
     the sole item of ``line_dict['inchworm']``.
     """
     lines = [
         "20140919 11:08:49 44009 user 20 44008 0 R 10975748 0 10837764 10957692 92 128 3416 9 0.00 4.99 99 "
         "01:33:35 0 0 0 0 0 0 0 0 1 /N/test/Inchworm/bin/inchworm --kmers jellyfish.kmers.fa --run_inchworm "
         "-K 25 -L 25 --monitor 1",
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(lines, line_dict['inchworm'])
Example #10
0
 def test_build_datasets_returns_last_line_time_as_end_time(self):
     """The end time comes from the last input line, split into date and time.

     The first line deliberately carries a later clock time (13:10:49)
     than the last one (11:27:49), so the expected value shows that
     position in the input, not the latest timestamp, decides the result.
     """
     lines = [
         "20140919 13:10:49\n",
         "20140919 11:10:49\n",
         "20140919 11:27:49\n",
     ]
     _, _, _, _, end_time = make_data_files.build_datasets(generate(lines))
     # assertEqual, not the deprecated assertEquals alias (removed in Python 3.12).
     self.assertEqual(['20140919', '11:27:49'], end_time)
Example #11
0
 def test_shell_c_commands_are_dropped(self):
     """Check that a line whose command is ``sh -c ...`` is not recorded.

     After ``build_datasets`` processes the single shell-wrapper line, the
     returned line dict must contain no keys at all.
     """
     # Implicit concatenation inside the list literal replaces the original
     # redundant backslash line continuations.
     lines = [
         "20140919 10:06:14 43812 befulton 20 43684 0 S 108160 0 1228 196 92 848 1832 1 0.00 0.00 0 00:00.00 "
         "0 0 0 0 0 0 0 0 0 sh -c /trinity/trinity-plugins/fastool/fastool --rev  --illumina-trinity "
         "--to-fasta /jobdir/reads.left.fq >> left.fa"
     ]
     _, line_dict, _, _, _ = make_data_files.build_datasets(generate(lines))
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(0, len(line_dict))
Example #12
0
 def test_build_datasets_returns_last_line_time_as_end_time(self):
     """Check that the fifth returned value is the last line's [date, time].

     The input is not in chronological order: the first line has the
     latest clock time. The expected end time is still taken from the
     final line, with the trailing newline removed.
     """
     lines = [
         "20140919 13:10:49\n", "20140919 11:10:49\n", "20140919 11:27:49\n"
     ]
     _, _, _, _, end_time = make_data_files.build_datasets(generate(lines))
     # The assertEquals alias is deprecated and no longer exists on Python 3.12+.
     self.assertEqual(['20140919', '11:27:49'], end_time)