Exemple #1
0
 def _split_dependency_path(self, file_name):
     if file_name in self.root_cache:
         root = self.root_cache[file_name]
         dep_path = file_name[len(root) + 1:]
     else:
         root, dep_path = relfile(file_name, [])
         self.root_cache[file_name] = root
     return root, dep_path
Exemple #2
0
    def _add_dependencies(self, fn, in_roots, files):
        """
        Record the non-internal dependencies of ``fn`` in ``self.all_files``.

        :param fn: file name of the module whose dependencies are recorded
        :param in_roots: container tested against the first element of each
            dependency's ``relfile()`` result; a match marks the dependency
            as internal and it is skipped
        :param files: iterable of file names that ``fn`` depends on
        :return: always None; ``self.all_files`` is modified in place
        """
        from_ = relfile(fn, [])
        if from_ is None:
            return None

        # Add the dependencies.
        for dfn in files:
            # A package is represented by its directory, not its __init__.py.
            xfn = dirname(dfn) if basename(dfn) == '__init__.py' else dfn

            to_ = relfile(xfn, [])
            if to_ is None:
                # Same guard as for the source file above: an unresolved
                # target is skipped instead of failing on ``to_[0]``.
                continue
            if to_[0] in in_roots:
                # Skip internal dependency.
                continue
            self.all_files[from_].add(to_)
Exemple #3
0
 def scan(self):
     """
     Scan the input paths and build the graph of their import dependencies.

     Returns an ImportGraph, or None when the print-roots option is set
     (in that case the roots are printed to stdout and nothing else is
     done).

     Raises SnakefoodScannerException when the internal and external
     filters are combined, when an input path does not exist, or when one
     of those filters is requested but no package root is found.

     Side effects: self.optsVerbose is decremented by self.optsQuiet,
     setup_logging() is called, and the input roots are prepended to
     sys.path.
     """
     self.optsVerbose -= self.optsQuiet
     setup_logging(self.optsVerbose)
     info = logging.info
     warning = logging.warning
     debug = logging.debug

     def target_order(target):
         # Sort key for dependency targets.  The (None, None) placeholder
         # sorts first and None is never compared with a string, which
         # would raise TypeError on Python 3.
         root, name = target
         return (root is not None, root or "", name or "")

     if self.optsInternal and self.optsExternal:
         message = "Using --internal and --external at the same time " \
             "does not make sense."
         raise SnakefoodScannerException(message)
     if self.optsPrintRoots:
         inroots = find_roots(self.args, self.optsIgnores)
         for dn in sorted(inroots):
             print(dn)
         return None
     info("")
     info("Input paths:")
     for arg in self.args:
         fn = os.path.realpath(arg)
         info('  {}'.format(fn))
         if not os.path.exists(fn):
             message = "Filename '{}' does not exist.".format(fn)
             raise SnakefoodScannerException(message)
     # Get the list of package roots for our input files and prepend
     # them to the module search path to ensure localized imports.
     inroots = find_roots(self.args, self.optsIgnores)
     if (self.optsInternal or self.optsExternal) and not inroots:
         message = "No package roots found from the given files or " \
             "directories. Using --internal with these roots will  " \
             "generate no dependencies."
         raise SnakefoodScannerException(message)
     info("")
     info("Roots of the input files:")
     for root in inroots:
         info('  {}'.format(root))
     info("")
     info("Using the following import path to search for modules:")
     sys.path = inroots + sys.path
     for dn in sys.path:
         info("  {}".format(dn))
     inroots = frozenset(inroots)
     # Find all the dependencies.
     info("")
     info("Processing files:")
     info("")
     allfiles = defaultdict(set)
     allerrors = []
     processed_files = set()
     fiter = iter_pyfiles(self.args, self.optsIgnores, False)
     while True:
         newfiles = set()
         for fn in fiter:
             if fn in processed_files:
                 continue  # Make sure we process each file only once.
             info("  {}".format(fn))
             processed_files.add(fn)
             if is_python(fn):
                 # NOTE(review): the last argument repeats optsVerbose;
                 # confirm against find_dependencies' signature that
                 # this is the intended value.
                 files, errors = find_dependencies(
                     fn, self.optsVerbose,
                     self.optsDoPragmas, self.optsVerbose)
                 allerrors.extend(errors)
             else:
                 # If the file is not a source file, we don't know how
                 # to get the dependencies of that (without importing,
                 # which we want to avoid).
                 files = []
             # When packages are the source of dependencies, remove the
             # __init__ file.  This is important because the targets
             # also do not include the __init__ (i.e. when "from
             # <package> import <subpackage>" is seen).
             if os.path.basename(fn) == '__init__.py':
                 fn = os.path.dirname(fn)
             # Make sure all the files at least appear in the output,
             # even if it has no dependency.
             from_ = relfile(fn, self.optsIgnores)
             if from_ is None:
                 continue
             infrom = from_[0] in inroots
             if self.optsInternal and not infrom:
                 continue
             if not self.optsExternal:
                 allfiles[from_].add((None, None))
             # Add the dependencies.
             for dfn in files:
                 xfn = dfn
                 if os.path.basename(xfn) == '__init__.py':
                     xfn = os.path.dirname(xfn)
                 to_ = relfile(xfn, self.optsIgnores)
                 if to_ is None:
                     # Same guard as for from_ above: skip a target
                     # that relfile() could not resolve instead of
                     # failing on to_[0].
                     continue
                 into = to_[0] in inroots
                 if (self.optsInternal and not into) or \
                         (self.optsExternal and into):
                     continue
                 allfiles[from_].add(to_)
                 newfiles.add(dfn)
         if not (self.optsFollow and newfiles):
             break
         # Follow mode: the next pass scans the dependencies just found.
         fiter = iter(sorted(newfiles))
     # If internal is used twice, we filter down further the
     # dependencies to the set of files that were processed only,
     # not just to the files that live in the same roots.
     if self.optsInternal >= 2:
         filtfiles = type(allfiles)()
         # .items() works on both Python 2 and 3; .iteritems() is 2-only.
         for from_, tolist in allfiles.items():
             filtfiles[from_] = set(
                 x for x in tolist if x in allfiles or x == (None, None))
         allfiles = filtfiles
     info("")
     info("SUMMARY")
     info("=======")
     # Output a list of the symbols that could not
     # be imported as modules.
     reports = [
         ("Modules that were ignored because not used:",
             ERROR_UNUSED, info),
         ("Modules that could not be imported:",
             ERROR_IMPORT, warning),
         ]
     if self.optsVerbose >= 2:
         reports.append(
             ("Symbols that could not be imported as modules:",
                 ERROR_SYMBOL, debug))
     for msg, errtype, efun in reports:
         names = set(name for (err, name) in allerrors if err is errtype)
         if names:
             efun("")
             efun(msg)
             for name in sorted(names):
                 efun("  {}".format(name))
     # Output the list of roots found.
     info("")
     info("Found roots:")
     foundRoots = set()
     for key, files in allfiles.items():
         foundRoots.add(key[0])
         foundRoots.update(map(operator.itemgetter(0), files))
     # The (None, None) placeholder contributes a None root; drop it.
     foundRoots.discard(None)
     for root in sorted(foundRoots):
         info("  {}".format(root))
     # Output the dependencies.
     entries = SnakefoodEntries()
     info("")
     for (from_root, from_), targets in sorted(
             allfiles.items(), key=operator.itemgetter(0)):
         for to_root, to_ in sorted(targets, key=target_order):
             entry = SnakefoodEntry(from_root, from_, to_root, to_)
             entries.append(entry)
     graph = ImportGraph()
     for entry in entries.iterEntries():
         graph.addEntry(entry)
     return graph
Exemple #4
0
 def scan(self):
     """
     Scan the input paths and build the graph of their import dependencies.

     Returns an ImportGraph, or None when the print-roots option is set
     (in that case the roots are printed to stdout and nothing else is
     done).

     Raises SnakefoodScannerException when the internal and external
     filters are combined, when an input path does not exist, or when one
     of those filters is requested but no package root is found.

     Side effects: self.optsVerbose is decremented by self.optsQuiet,
     setup_logging() is called, and the input roots are prepended to
     sys.path.
     """
     self.optsVerbose -= self.optsQuiet
     setup_logging(self.optsVerbose)
     info = logging.info
     warning = logging.warning
     debug = logging.debug

     def target_order(target):
         # Sort key for dependency targets.  The (None, None) placeholder
         # sorts first and None is never compared with a string, which
         # would raise TypeError on Python 3.
         root, name = target
         return (root is not None, root or "", name or "")

     if self.optsInternal and self.optsExternal:
         message = "Using --internal and --external at the same time " \
             "does not make sense."
         raise SnakefoodScannerException(message)
     if self.optsPrintRoots:
         inroots = find_roots(self.args, self.optsIgnores)
         for dn in sorted(inroots):
             print(dn)
         return None
     info("")
     info("Input paths:")
     for arg in self.args:
         fn = os.path.realpath(arg)
         info('  {}'.format(fn))
         if not os.path.exists(fn):
             message = "Filename '{}' does not exist.".format(fn)
             raise SnakefoodScannerException(message)
     # Get the list of package roots for our input files and prepend
     # them to the module search path to ensure localized imports.
     inroots = find_roots(self.args, self.optsIgnores)
     if (self.optsInternal or self.optsExternal) and not inroots:
         message = "No package roots found from the given files or " \
             "directories. Using --internal with these roots will  " \
             "generate no dependencies."
         raise SnakefoodScannerException(message)
     info("")
     info("Roots of the input files:")
     for root in inroots:
         info('  {}'.format(root))
     info("")
     info("Using the following import path to search for modules:")
     sys.path = inroots + sys.path
     for dn in sys.path:
         info("  {}".format(dn))
     inroots = frozenset(inroots)
     # Find all the dependencies.
     info("")
     info("Processing files:")
     info("")
     allfiles = defaultdict(set)
     allerrors = []
     processed_files = set()
     fiter = iter_pyfiles(self.args, self.optsIgnores, False)
     while True:
         newfiles = set()
         for fn in fiter:
             if fn in processed_files:
                 continue  # Make sure we process each file only once.
             info("  {}".format(fn))
             processed_files.add(fn)
             if is_python(fn):
                 # NOTE(review): the last argument repeats optsVerbose;
                 # confirm against find_dependencies' signature that
                 # this is the intended value.
                 files, errors = find_dependencies(
                     fn, self.optsVerbose,
                     self.optsDoPragmas, self.optsVerbose)
                 allerrors.extend(errors)
             else:
                 # If the file is not a source file, we don't know how
                 # to get the dependencies of that (without importing,
                 # which we want to avoid).
                 files = []
             # When packages are the source of dependencies, remove the
             # __init__ file.  This is important because the targets
             # also do not include the __init__ (i.e. when "from
             # <package> import <subpackage>" is seen).
             if os.path.basename(fn) == '__init__.py':
                 fn = os.path.dirname(fn)
             # Make sure all the files at least appear in the output,
             # even if it has no dependency.
             from_ = relfile(fn, self.optsIgnores)
             if from_ is None:
                 continue
             infrom = from_[0] in inroots
             if self.optsInternal and not infrom:
                 continue
             if not self.optsExternal:
                 allfiles[from_].add((None, None))
             # Add the dependencies.
             for dfn in files:
                 xfn = dfn
                 if os.path.basename(xfn) == '__init__.py':
                     xfn = os.path.dirname(xfn)
                 to_ = relfile(xfn, self.optsIgnores)
                 if to_ is None:
                     # Same guard as for from_ above: skip a target
                     # that relfile() could not resolve instead of
                     # failing on to_[0].
                     continue
                 into = to_[0] in inroots
                 if (self.optsInternal and not into) or \
                         (self.optsExternal and into):
                     continue
                 allfiles[from_].add(to_)
                 newfiles.add(dfn)
         if not (self.optsFollow and newfiles):
             break
         # Follow mode: the next pass scans the dependencies just found.
         fiter = iter(sorted(newfiles))
     # If internal is used twice, we filter down further the
     # dependencies to the set of files that were processed only,
     # not just to the files that live in the same roots.
     if self.optsInternal >= 2:
         filtfiles = type(allfiles)()
         # .items() works on both Python 2 and 3; .iteritems() is 2-only.
         for from_, tolist in allfiles.items():
             filtfiles[from_] = set(
                 x for x in tolist if x in allfiles or x == (None, None))
         allfiles = filtfiles
     info("")
     info("SUMMARY")
     info("=======")
     # Output a list of the symbols that could not
     # be imported as modules.
     reports = [
         ("Modules that were ignored because not used:",
             ERROR_UNUSED, info),
         ("Modules that could not be imported:",
             ERROR_IMPORT, warning),
         ]
     if self.optsVerbose >= 2:
         reports.append(
             ("Symbols that could not be imported as modules:",
                 ERROR_SYMBOL, debug))
     for msg, errtype, efun in reports:
         names = set(name for (err, name) in allerrors if err is errtype)
         if names:
             efun("")
             efun(msg)
             for name in sorted(names):
                 efun("  {}".format(name))
     # Output the list of roots found.
     info("")
     info("Found roots:")
     foundRoots = set()
     for key, files in allfiles.items():
         foundRoots.add(key[0])
         foundRoots.update(map(operator.itemgetter(0), files))
     # The (None, None) placeholder contributes a None root; drop it.
     foundRoots.discard(None)
     for root in sorted(foundRoots):
         info("  {}".format(root))
     # Output the dependencies.
     entries = SnakefoodEntries()
     info("")
     for (from_root, from_), targets in sorted(
             allfiles.items(), key=operator.itemgetter(0)):
         for to_root, to_ in sorted(targets, key=target_order):
             entry = SnakefoodEntry(from_root, from_, to_root, to_)
             entries.append(entry)
     graph = ImportGraph()
     for entry in entries.iterEntries():
         graph.addEntry(entry)
     return graph
def gendeps():
    """Command-line entry point: find and output import dependencies.

    Parses the command-line options, determines the package roots of the
    input paths (the current directory when no path is given), collects
    the dependencies of every file found, logs a summary, and hands the
    result to output_depends().

    With --print-roots only the package roots are printed.  Invalid
    option combinations and missing input paths are reported through
    parser.error().

    Side effects: setup_logging() is called and the input roots are
    prepended to sys.path.
    """
    import optparse
    parser = optparse.OptionParser()

    parser.add_option(
        '-i',
        '--internal',
        '--internal-only',
        default=0,
        action='count',
        help="Filter out dependencies that are outside of the "
        "roots of the input files. If internal is used twice, we "
        "filter down further the dependencies to the set of "
        "files that were processed only, not just to the files "
        "that live in the same roots.")

    parser.add_option(
        '-e',
        '--external',
        '--external-only',
        action='store_true',
        help="Filter out dependencies to modules within the "
        "roots of the input files. This can be used to find out "
        "what external modules a package depends on, for example. "
        "Note that it does not make sense to use --internal and "
        "--external at the same time, as --internal will reject "
        "all the dependencies --external allows would output.")

    # The 'append' action appends to the default list object itself, so a
    # copy is passed to keep the shared def_ignores list unmodified.
    parser.add_option(
        '-I',
        '--ignore',
        dest='ignores',
        action='append',
        default=list(def_ignores),
        help="Add the given directory name to the list to be ignored.")

    parser.add_option('-v',
                      '--verbose',
                      action='count',
                      default=0,
                      help="Output more debugging information")
    parser.add_option('-q',
                      '--quiet',
                      action='count',
                      default=0,
                      help="Output less debugging information")

    parser.add_option(
        '-f',
        '--follow',
        '-r',
        '--recursive',
        action='store_true',
        help="Follow the modules depended upon and trace their dependencies. "
        "WARNING: This can be slow.  Use --internal to limit the scope.")

    parser.add_option(
        '--print-roots',
        action='store_true',
        help="Only print the package roots corresponding to the input files. "
        "This is mostly used for testing and troubleshooting.")

    parser.add_option(
        '-d',
        '--disable-pragmas',
        action='store_false',
        dest='do_pragmas',
        default=True,
        help="Disable processing of pragma directives as strings after imports."
    )

    parser.add_option(
        '-u',
        '--ignore-unused',
        action='store_true',
        help="Automatically ignore unused imports. (See sfood-checker.)")

    opts, args = parser.parse_args()
    opts.verbose -= opts.quiet
    setup_logging(opts.verbose)

    if not args:
        logging.warning("Searching for files from current directory.")
        args = ['.']

    info = logging.info

    if opts.internal and opts.external:
        parser.error(
            "Using --internal and --external at the same time does not make sense."
        )

    if opts.print_roots:
        inroots = find_roots(args, opts.ignores)
        for dn in sorted(inroots):
            print(dn)
        return

    info("")
    info("Input paths:")
    for arg in args:
        fn = realpath(arg)
        info('  %s' % fn)
        if not exists(fn):
            parser.error("Filename '%s' does not exist." % fn)

    # Get the list of package roots for our input files and prepend them to the
    # module search path to ensure localized imports.
    inroots = find_roots(args, opts.ignores)
    if (opts.internal or opts.external) and not inroots:
        parser.error(
            "No package roots found from the given files or directories. "
            "Using --internal with these roots will generate no dependencies.")
    info("")
    info("Roots of the input files:")
    for root in inroots:
        info('  %s' % root)

    info("")
    info("Using the following import path to search for modules:")
    sys.path = inroots + sys.path
    for dn in sys.path:
        info("  %s" % dn)
    inroots = frozenset(inroots)

    # Find all the dependencies.
    info("")
    info("Processing files:")
    info("")
    allfiles = defaultdict(set)
    allerrors = []
    processed_files = set()

    fiter = iter_pyfiles(args, opts.ignores, False)
    while True:
        newfiles = set()
        for fn in fiter:
            if fn in processed_files:
                continue  # Make sure we process each file only once.

            info("  %s" % fn)
            processed_files.add(fn)

            if is_python(fn):
                files, errors = find_dependencies(fn, opts.verbose,
                                                  opts.do_pragmas,
                                                  opts.ignore_unused)
                allerrors.extend(errors)
            else:
                # If the file is not a source file, we don't know how to get the
                # dependencies of that (without importing, which we want to
                # avoid).
                files = []

            # When packages are the source of dependencies, remove the __init__
            # file.  This is important because the targets also do not include the
            # __init__ (i.e. when "from <package> import <subpackage>" is seen).
            if basename(fn) == '__init__.py':
                fn = dirname(fn)

            # Make sure all the files at least appear in the output, even if it has
            # no dependency.
            from_ = relfile(fn, opts.ignores)
            if from_ is None:
                continue
            infrom = from_[0] in inroots
            if opts.internal and not infrom:
                continue
            if not opts.external:
                allfiles[from_].add((None, None))

            # Add the dependencies.
            for dfn in files:
                xfn = dfn
                if basename(xfn) == '__init__.py':
                    xfn = dirname(xfn)

                to_ = relfile(xfn, opts.ignores)
                if to_ is None:
                    # Same guard as for from_ above: skip a target that
                    # relfile() could not resolve instead of failing on
                    # to_[0].
                    continue
                into = to_[0] in inroots
                if (opts.internal and not into) or (opts.external and into):
                    continue
                allfiles[from_].add(to_)
                newfiles.add(dfn)

        if not (opts.follow and newfiles):
            break
        # Follow mode: the next pass scans the dependencies just found.
        fiter = iter(sorted(newfiles))

    # If internal is used twice, we filter down further the dependencies to the
    # set of files that were processed only, not just to the files that live in
    # the same roots.
    if opts.internal >= 2:
        filtfiles = type(allfiles)()
        for from_, tolist in iteritems(allfiles):
            filtfiles[from_] = set(x for x in tolist
                                   if x in allfiles or x == (None, None))
        allfiles = filtfiles

    info("")
    info("SUMMARY")
    info("=======")

    # Output a list of the symbols that could not be imported as modules.
    reports = [
        ("Modules that were ignored because not used:", ERROR_UNUSED,
         logging.info),
        ("Modules that could not be imported:", ERROR_IMPORT, logging.warning),
    ]
    if opts.verbose >= 2:
        reports.append(("Symbols that could not be imported as modules:",
                        ERROR_SYMBOL, logging.debug))

    for msg, errtype, efun in reports:
        names = set(name for (err, name) in allerrors if err is errtype)
        if names:
            efun("")
            efun(msg)
            for name in sorted(names):
                efun("  %s" % name)

    # Output the list of roots found.
    info("")
    info("Found roots:")

    found_roots = set()
    for key, files in iteritems(allfiles):
        found_roots.add(key[0])
        found_roots.update(map(itemgetter(0), files))
    # The (None, None) placeholder contributes a None root; drop it.
    found_roots.discard(None)
    for root in sorted(found_roots):
        info("  %s" % root)

    # Output the dependencies.
    info("")
    output_depends(allfiles)