Beispiel #1
0
    def list_all_files(self):
        """
        list all the files and directories for a given path.
        ignore .svn, .git, .gitignore, *.pyc
        :return: e.g.: {
            'path': '/home/source'
            'dirs': ['dir1', 'dir2', 'dir3'],
            'files': ['file1', 'file2', 'file3'],
            'dir1': ['dir1/f1.py', 'dir1/a/f2.py'],
            'dir2': ['dir2/f1.py', 'dir2/f2.py', 'dir2/aa/bb/cc/dd.py'],
            'dir3': []
        }
        """
        cache = file_db.query_dirs(self.path)
        if cache:
            return cache
        result = {
            'path': self.path,
            'dirs': [],
            'files': []
        }
        dirs = []
        files = []
        for filename in os.listdir(self.path):
            # ignore .git .ssh .svn, etc
            if not filename.startswith('.'):
                full_path = os.path.join(self.path, filename)
                if os.path.isdir(full_path):
                    dirs.append(filename)
                else:
                    # ignore .pyc
                    if filename.endswith('.py'):
                        parser = CodeParser(filename=full_path)
                        statements, _ = parser.parse_source()
                        files.append(("/" + filename, len(statements)))
        result['dirs'] = sorted(dirs)
        result['files'] = sorted(files)

        for dirname in result['dirs']:
            full_path = self.path + '/' + dirname
            result[dirname] = self._dfs(full_path)
        file_db.save_dirs(self.path, result)
        return result
Beispiel #2
0
 def _dfs(self, filename):
     stack = []
     ret = []
     stack.append(filename)
     while len(stack) > 0:
         tmp = stack.pop()
         if os.path.isdir(tmp):
             for item in os.listdir(tmp):
                 # ignore .git .xxoo
                 if not item.startswith('.'):
                     # why not use path.join? because in windows we usually have a\\b and
                     # in linux we usually have a/b, however, the path is the id of some
                     # html element, which may cause conflicts
                     stack.append(tmp + '/' + item)
         else:
             if not tmp.startswith('.') and tmp.endswith('.py'):
                 # ignore .gitignore, *.pyc
                 parser = CodeParser(filename=tmp)
                 statements, _ = parser.parse_source()
                 ret.append((tmp.replace(self.path, ''), len(statements)))
     return ret
Beispiel #3
0
 def _dfs(self, filename):
     stack = []
     ret = []
     stack.append(filename)
     while len(stack) > 0:
         tmp = stack.pop()
         if os.path.isdir(tmp):
             for item in os.listdir(tmp):
                 # ignore .git .xxoo
                 if not item.startswith('.'):
                     # why not use path.join? because in windows we usually have a\\b and
                     # in linux we usually have a/b, however, the path is the id of some
                     # html element, which may cause conflicts
                     stack.append(tmp + '/' + item)
         else:
             if not tmp.startswith('.') and tmp.endswith('.py'):
                 # ignore .gitignore, *.pyc
                 parser = CodeParser(filename=tmp)
                 statements, _ = parser.parse_source()
                 ret.append((tmp.replace(self.path, ''), len(statements)))
     return ret
Beispiel #4
0
    def list_all_files(self):
        """
        list all the files and directories for a given path.
        ignore .svn, .git, .gitignore, *.pyc
        :return: e.g.: {
            'path': '/home/source'
            'dirs': ['dir1', 'dir2', 'dir3'],
            'files': ['file1', 'file2', 'file3'],
            'dir1': ['dir1/f1.py', 'dir1/a/f2.py'],
            'dir2': ['dir2/f1.py', 'dir2/f2.py', 'dir2/aa/bb/cc/dd.py'],
            'dir3': []
        }
        """
        cache = file_db.query_dirs(self.path)
        if cache:
            return cache
        result = {'path': self.path, 'dirs': [], 'files': []}
        dirs = []
        files = []
        for filename in os.listdir(self.path):
            # ignore .git .ssh .svn, etc
            if not filename.startswith('.'):
                full_path = os.path.join(self.path, filename)
                if os.path.isdir(full_path):
                    dirs.append(filename)
                else:
                    # ignore .pyc
                    if filename.endswith('.py'):
                        parser = CodeParser(filename=full_path)
                        statements, _ = parser.parse_source()
                        files.append(("/" + filename, len(statements)))
        result['dirs'] = sorted(dirs)
        result['files'] = sorted(files)

        for dirname in result['dirs']:
            full_path = self.path + '/' + dirname
            result[dirname] = self._dfs(full_path)
        file_db.save_dirs(self.path, result)
        return result