Esempio n. 1
0
    def test_get_files_paths_subdirectories_dirs_formats(self):
        project_dir = "tests/resources/projects/project-003-subdirectories"
        os.chdir(project_dir)

        paths = ["data/input"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("data/input/input.csv" in files)
        self.assertFalse("data/processed/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["data/input/*"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("data/input/input.csv" in files)
        self.assertFalse("data/processed/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["/data/input"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 0)  # because the folder doesn't exist

        paths = ["data/input/"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("data/input/input.csv" in files)
        self.assertFalse("data/processed/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["data/input/*"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("data/input/input.csv" in files)
        self.assertFalse("data/processed/input.csv" in files)
        self.assertFalse("askanna.yml" in files)
Esempio n. 2
0
    def test_get_files_paths_simple(self):
        project_dir = "tests/resources/projects/project-001-simple"
        os.chdir(project_dir)

        files = get_files_in_paths(["."])
        self.assertEqual(len(files), 3)
        self.assertTrue("askanna.yml" in files)

        files = get_files_in_paths(["*"])
        self.assertEqual(len(files), 3)
        self.assertTrue("askanna.yml" in files)
Esempio n. 3
0
    def test_get_files_paths_simple_single_file(self):
        project_dir = "tests/resources/projects/project-001-simple"
        os.chdir(project_dir)

        paths = ["result.json"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("result.json" in files)

        paths = ["/result.json"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 0)  # because the file doesn't exist
Esempio n. 4
0
    def test_get_files_paths_directories_dirs(self):
        project_dir = "tests/resources/projects/project-002-directories"
        os.chdir(project_dir)

        paths = ["data"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 2)
        self.assertTrue("data/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["data/*"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 2)
        self.assertTrue("data/input.csv" in files)
        self.assertFalse("askanna.yml" in files)
Esempio n. 5
0
    def test_get_files_paths_subdirectories(self):
        project_dir = "tests/resources/projects/project-003-subdirectories"
        os.chdir(project_dir)

        files = get_files_in_paths(".")
        self.assertEqual(len(files), 28)
        self.assertTrue("askanna.yml" in files)
Esempio n. 6
0
    def test_get_files_paths_subdirectories_unique_files(self):
        project_dir = "tests/resources/projects/project-003-subdirectories"
        os.chdir(project_dir)

        paths = ["data", "model/model.pkl", "model/"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 5)
        self.assertFalse("model/model.pkl" in files)
        self.assertTrue("data/processed/input.csv" in files)
        self.assertFalse("askanna.yml" in files)
Esempio n. 7
0
    def test_get_files_paths_subdirectories_single_file(self):
        project_dir = "tests/resources/projects/project-003-subdirectories"
        os.chdir(project_dir)

        paths = ["model/model.pkl"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 0)
        self.assertFalse("model/model.pkl" in files)
        self.assertFalse("data/input.csv" in files)
        self.assertFalse("askanna.yml" in files)
Esempio n. 8
0
    def test_get_files_from_excluded_paths(self):
        project_dir = "tests/resources/projects/project-003-subdirectories"
        os.chdir(project_dir)

        exclude_paths = [
            "/",
            "/bin",
            "/dev",
            "/lib",
            "/mnt",
            "/opt",
            "/proc",
            "/tmp",
            "/usr",
            "/var",
        ]

        paths = ["/"]
        files = get_files_in_paths(paths, exclude_paths)
        self.assertEqual(len(files), 0)
        self.assertFalse("askanna.yml" in files)

        paths = ["/bin"]
        files = get_files_in_paths(paths, exclude_paths)
        self.assertEqual(len(files), 0)
        self.assertFalse("askanna.yml" in files)

        paths = ["/var"]
        files = get_files_in_paths(paths, exclude_paths)
        self.assertEqual(len(files), 0)
        self.assertFalse("askanna.yml" in files)

        paths = exclude_paths
        self.assertGreater(len(paths), 0)
        files = get_files_in_paths(paths, exclude_paths)
        self.assertEqual(len(files), 0)
        self.assertFalse("askanna.yml" in files)

        paths = ["/", "."]
        files = get_files_in_paths(paths, exclude_paths)
        self.assertEqual(len(files), 28)
        self.assertTrue("askanna.yml" in files)
Esempio n. 9
0
    def test_get_files_paths_directories_unique_files(self):
        project_dir = "tests/resources/projects/project-002-directories"
        os.chdir(project_dir)

        paths = ["data", "/data", "data/"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 2)
        self.assertTrue("data/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["data", "/data", "data/", "data/dump.txt"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 2)
        self.assertTrue("data/input.csv" in files)
        self.assertFalse("askanna.yml" in files)

        paths = ["/data", "model/model.pkl", "model/"]
        files = get_files_in_paths(paths)
        self.assertEqual(len(files), 1)
        self.assertTrue("model/model.pkl" in files)
        self.assertFalse("askanna.yml" in files)