init

2022-03-31 20:20:07 -05:00 · 2022-03-31 20:20:07 -05:00 · 38355d2442
commit 38355d2442
9083 changed files with 1225834 additions and 0 deletions
--- a/.venv/lib/python3.8/site-packages/pyflyby/_importdb.py
+++ b/.venv/lib/python3.8/site-packages/pyflyby/_importdb.py
@ -0,0 +1,581 @@
+# pyflyby/_importdb.py.
+# Copyright (C) 2011, 2012, 2013, 2014, 2015 Karl Chen.
+# License: MIT http://opensource.org/licenses/MIT
+
+from __future__ import (absolute_import, division, print_function,
+                        with_statement)
+
+from   collections              import defaultdict
+import os
+import re
+import six
+
+from   pyflyby._file            import Filename, expand_py_files_from_args
+from   pyflyby._idents          import dotted_prefixes
+from   pyflyby._importclns      import ImportMap, ImportSet
+from   pyflyby._importstmt      import Import, ImportStatement
+from   pyflyby._log             import logger
+from   pyflyby._parse           import PythonBlock
+from   pyflyby._util            import cached_attribute, memoize, stable_unique
+
+
+@memoize
+def _find_etc_dirs():
+    result = []
+    dirs = Filename(__file__).real.dir.ancestors[:-1]
+    for dir in dirs:
+        candidate = dir / "etc/pyflyby"
+        if candidate.isdir:
+            result.append(candidate)
+            break
+    global_dir = Filename("/etc/pyflyby")
+    if global_dir.exists:
+        result.append(global_dir)
+    return result
+
+
+def _get_env_var(env_var_name, default):
+    '''
+    Get an environment variable and split on ":", replacing ``-`` with the
+    default.
+    '''
+    assert re.match("^[A-Z_]+$", env_var_name)
+    assert isinstance(default, (tuple, list))
+    value = list(filter(None, os.environ.get(env_var_name, '').split(':')))
+    if not value:
+        return default
+    # Replace '-' with ``default``
+    try:
+        idx = value.index('-')
+    except ValueError:
+        pass
+    else:
+        value[idx:idx+1] = default
+    return value
+
+
+def _get_python_path(env_var_name, default_path, target_dirname):
+    '''
+    Expand an environment variable specifying pyflyby input config files.
+
+      - Default to ``default_path`` if the environment variable is undefined.
+      - Process colon delimiters.
+      - Replace "-" with ``default_path``.
+      - Expand triple dots.
+      - Recursively traverse directories.
+
+    :rtype:
+      ``tuple`` of ``Filename`` s
+    '''
+    pathnames = _get_env_var(env_var_name, default_path)
+    if pathnames == ["EMPTY"]:
+        # The special code PYFLYBY_PATH=EMPTY means we intentionally want to
+        # use an empty PYFLYBY_PATH (and don't fall back to the default path,
+        # nor warn about an empty path).
+        return ()
+    for p in pathnames:
+        if re.match("/|[.]/|[.][.][.]/|~/", p):
+            continue
+        raise ValueError(
+            "{env_var_name} components should start with / or ./ or ~/ or .../.  "
+            "Use {env_var_name}=./{p} instead of {env_var_name}={p} if you really "
+            "want to use the current directory."
+            .format(env_var_name=env_var_name, p=p))
+    pathnames = [os.path.expanduser(p) for p in pathnames]
+    pathnames = _expand_tripledots(pathnames, target_dirname)
+    pathnames = [Filename(fn) for fn in pathnames]
+    pathnames = stable_unique(pathnames)
+    pathnames = expand_py_files_from_args(pathnames)
+    if not pathnames:
+        logger.warning(
+            "No import libraries found (%s=%r, default=%r)"
+            % (env_var_name, os.environ.get(env_var_name), default_path))
+    return tuple(pathnames)
+
+
+# TODO: stop memoizing here after using StatCache.  Actually just inline into
+# _ancestors_on_same_partition
+@memoize
+def _get_st_dev(filename):
+    filename = Filename(filename)
+    try:
+        return os.stat(str(filename)).st_dev
+    except OSError:
+        return None
+
+
+def _ancestors_on_same_partition(filename):
+    """
+    Generate ancestors of ``filename`` that exist and are on the same partition
+    as the first existing ancestor of ``filename``.
+
+    For example, suppose a partition is mounted on /u/homer; /u is a different
+    partition.  Suppose /u/homer/aa exists but /u/homer/aa/bb does not exist.
+    Then::
+
+      >>> _ancestors_on_same_partition(Filename("/u/homer/aa/bb/cc")) # doctest: +SKIP
+      [Filename("/u/homer", Filename("/u/homer/aa")]
+
+    :rtype:
+      ``list`` of ``Filename``
+    """
+    result = []
+    dev = None
+    for f in filename.ancestors:
+        this_dev = _get_st_dev(f)
+        if this_dev is None:
+            continue
+        if dev is None:
+            dev = this_dev
+        elif dev != this_dev:
+            break
+        result.append(f)
+    return result
+
+
+def _expand_tripledots(pathnames, target_dirname):
+    """
+    Expand pathnames of the form ``".../foo/bar"`` as "../../foo/bar",
+    "../foo/bar", "./foo/bar" etc., up to the oldest ancestor with the same
+    st_dev.
+
+    For example, suppose a partition is mounted on /u/homer; /u is a different
+    partition.  Then::
+
+      >>> _expand_tripledots(["/foo", ".../tt"], "/u/homer/aa") # doctest: +SKIP
+      [Filename("/foo"), Filename("/u/homer/tt"), Filename("/u/homer/aa/tt")]
+
+    :type pathnames:
+      sequence of ``str`` (not ``Filename``)
+    :type target_dirname:
+      `Filename`
+    :rtype:
+      ``list`` of `Filename`
+    """
+    target_dirname = Filename(target_dirname)
+    if not isinstance(pathnames, (tuple, list)):
+        pathnames = [pathnames]
+    result = []
+    for pathname in pathnames:
+        if not pathname.startswith(".../"):
+            result.append(Filename(pathname))
+            continue
+        suffix = pathname[4:]
+        expanded = [
+            p / suffix for p in _ancestors_on_same_partition(target_dirname) ]
+        result.extend(expanded[::-1])
+    return result
+
+
+class ImportDB(object):
+    """
+    A database of known, mandatory, canonical imports.
+
+    @iattr known_imports:
+      Set of known imports.  For use by tidy-imports and autoimporter.
+    @iattr mandatory_imports:
+      Set of imports that must be added by tidy-imports.
+    @iattr canonical_imports:
+      Map of imports that tidy-imports transforms on every run.
+    @iattr forget_imports:
+      Set of imports to remove from known_imports, mandatory_imports,
+      canonical_imports.
+    """
+
+    def __new__(cls, *args):
+        if len(args) != 1:
+            raise TypeError
+        arg, = args
+        if isinstance(arg, cls):
+            return arg
+        if isinstance(arg, ImportSet):
+            return cls._from_data(arg, [], [], [])
+        return cls._from_args(arg) # PythonBlock, Filename, etc
+
+
+    _default_cache = {}
+
+    @classmethod
+    def clear_default_cache(cls):
+        """
+        Clear the class cache of default ImportDBs.
+
+        Subsequent calls to ImportDB.get_default() will not reuse previously
+        cached results.  Existing ImportDB instances are not affected by this
+        call.
+        """
+        if cls._default_cache:
+            if logger.debug_enabled:
+                allpyfiles = set()
+                for tup in cls._default_cache:
+                    if tup[0] != 2:
+                        continue
+                    for tup2 in tup[1:]:
+                        for f in tup2:
+                            assert isinstance(f, Filename)
+                            if f.ext == '.py':
+                                allpyfiles.add(f)
+                nfiles = len(allpyfiles)
+                logger.debug("ImportDB: Clearing default cache of %d files",
+                             nfiles)
+            cls._default_cache.clear()
+
+    @classmethod
+    def get_default(cls, target_filename):
+        """
+        Return the default import library for the given target filename.
+
+        This will read various .../.pyflyby files as specified by
+        $PYFLYBY_PATH as well as older deprecated environment variables.
+
+        Memoized.
+
+        :param target_filename:
+          The target filename for which to get the import database.  Note that
+          the target filename itself is not read.  Instead, the target
+          filename is relevant because we look for .../.pyflyby based on the
+          target filename.
+        :rtype:
+          `ImportDB`
+        """
+        # We're going to canonicalize target_filenames in a number of steps.
+        # At each step, see if we've seen the input so far.  We do the cache
+        # checking incrementally since the steps involve syscalls.  Since this
+        # is going to potentially be executed inside the IPython interactive
+        # loop, we cache as much as possible.
+        # TODO: Consider refreshing periodically.  Check if files have
+        # been touched, and if so, return new data.  Check file timestamps at
+        # most once every 60 seconds.
+        cache_keys = []
+        target_filename = Filename(target_filename or ".")
+        if target_filename.startswith("/dev"):
+            target_filename = Filename(".")
+        target_dirname = target_filename
+        # TODO: with StatCache
+        while True:
+            cache_keys.append((1,
+                               target_dirname,
+                               os.getenv("PYFLYBY_PATH"),
+                               os.getenv("PYFLYBY_KNOWN_IMPORTS_PATH"),
+                               os.getenv("PYFLYBY_MANDATORY_IMPORTS_PATH")))
+            try:
+                return cls._default_cache[cache_keys[-1]]
+            except KeyError:
+                pass
+            if target_dirname.isdir:
+                break
+            target_dirname = target_dirname.dir
+        target_dirname = target_dirname.real
+        if target_dirname != cache_keys[-1][0]:
+            cache_keys.append((1,
+                               target_dirname,
+                               os.getenv("PYFLYBY_PATH"),
+                               os.getenv("PYFLYBY_KNOWN_IMPORTS_PATH"),
+                               os.getenv("PYFLYBY_MANDATORY_IMPORTS_PATH")))
+            try:
+                return cls._default_cache[cache_keys[-1]]
+            except KeyError:
+                pass
+        DEFAULT_PYFLYBY_PATH = []
+        DEFAULT_PYFLYBY_PATH += [str(p) for p in _find_etc_dirs()]
+        DEFAULT_PYFLYBY_PATH += [
+            ".../.pyflyby",
+            "~/.pyflyby",
+            ]
+        logger.debug("DEFAULT_PYFLYBY_PATH=%s", DEFAULT_PYFLYBY_PATH)
+        filenames = _get_python_path("PYFLYBY_PATH", DEFAULT_PYFLYBY_PATH,
+                                     target_dirname)
+        mandatory_imports_filenames = ()
+        if "SUPPORT DEPRECATED BEHAVIOR":
+            PYFLYBY_PATH = _get_env_var("PYFLYBY_PATH", DEFAULT_PYFLYBY_PATH)
+            # If the old deprecated environment variables are set, then heed
+            # them.
+            if os.getenv("PYFLYBY_KNOWN_IMPORTS_PATH"):
+                # Use PYFLYBY_PATH as the default for
+                # PYFLYBY_KNOWN_IMPORTS_PATH.  Note that the default is
+                # relevant even though we only enter this code path when the
+                # variable is set to anything, because the env var can
+                # reference "-" to include the default.
+                # Before pyflyby version 0.8, the default value would have
+                # been
+                #   [d/"known_imports" for d in PYFLYBY_PATH]
+                # Instead of using that, we just use PYFLYBY_PATH directly as
+                # the default.  This simplifies things and avoids need for a
+                # "known_imports=>." symlink for backwards compatibility.  It
+                # means that ~/.pyflyby/**/*.py (as opposed to only
+                # ~/.pyflyby/known_imports/**/*.py) would be included.
+                # Although this differs slightly from the old behavior, it
+                # matches the behavior of the newer PYFLYBY_PATH; matching the
+                # new behavior seems higher utility than exactly matching the
+                # old behavior.  Files under ~/.pyflyby/mandatory_imports will
+                # be included in known_imports as well, but that should not
+                # cause any problems.
+                default_path = PYFLYBY_PATH
+                # Expand $PYFLYBY_KNOWN_IMPORTS_PATH.
+                filenames = _get_python_path(
+                    "PYFLYBY_KNOWN_IMPORTS_PATH", default_path, target_dirname)
+                logger.debug(
+                    "The environment variable PYFLYBY_KNOWN_IMPORTS_PATH is deprecated.  "
+                    "Use PYFLYBY_PATH.")
+            if os.getenv("PYFLYBY_MANDATORY_IMPORTS_PATH"):
+                # Compute the "default" path.
+                # Note that we still calculate the erstwhile default value,
+                # even though it's no longer the defaults, in order to still
+                # allow the "-" in the variable.
+                default_path = [
+                    os.path.join(d,"mandatory_imports") for d in PYFLYBY_PATH]
+                # Expand $PYFLYBY_MANDATORY_IMPORTS_PATH.
+                mandatory_imports_filenames = _get_python_path(
+                    "PYFLYBY_MANDATORY_IMPORTS_PATH",
+                    default_path, target_dirname)
+                logger.debug(
+                    "The environment variable PYFLYBY_MANDATORY_IMPORTS_PATH is deprecated.  "
+                    "Use PYFLYBY_PATH and write __mandatory_imports__=['...'] in your files.")
+        cache_keys.append((2, filenames, mandatory_imports_filenames))
+        try:
+            return cls._default_cache[cache_keys[-1]]
+        except KeyError:
+            pass
+        result = cls._from_filenames(filenames, mandatory_imports_filenames)
+        for k in cache_keys:
+            cls._default_cache[k] = result
+        return result
+
+    @classmethod
+    def interpret_arg(cls, arg, target_filename):
+        if arg is None:
+            return cls.get_default(target_filename)
+        else:
+            return cls(arg)
+
+    @classmethod
+    def _from_data(cls, known_imports, mandatory_imports,
+                   canonical_imports, forget_imports):
+        self = object.__new__(cls)
+        self.forget_imports    = ImportSet(forget_imports   )
+        self.known_imports     = ImportSet(known_imports    ).without_imports(forget_imports)
+        self.mandatory_imports = ImportSet(mandatory_imports).without_imports(forget_imports)
+        # TODO: provide more fine-grained control about canonical_imports.
+        self.canonical_imports = ImportMap(canonical_imports).without_imports(forget_imports)
+        return self
+
+    @classmethod
+    def _from_args(cls, args):
+        # TODO: support merging input ImportDBs.  For now we support
+        # `PythonBlock` s and convertibles such as `Filename`.
+        return cls._from_code(args)
+
+    @classmethod
+    def _from_code(cls, blocks,
+                   _mandatory_imports_blocks_deprecated=(),
+                   _forget_imports_blocks_deprecated=(),
+               ):
+        """
+        Load an import database from code.
+
+          >>> ImportDB._from_code('''
+          ...     import foo, bar as barf
+          ...     from xx import yy
+          ...     __mandatory_imports__ = ['__future__.division',
+          ...                              'import aa . bb . cc as dd']
+          ...     __forget_imports__ = ['xx.yy', 'from xx import zz']
+          ...     __canonical_imports__ = {'bad.baad': 'good.goood'}
+          ... ''')
+          ImportDB('''
+            import bar as barf
+            import foo
+          <BLANKLINE>
+            __mandatory_imports__ = [
+              'from __future__ import division',
+              'from aa.bb import cc as dd',
+            ]
+          <BLANKLINE>
+            __canonical_imports__ = {
+              'bad.baad': 'good.goood',
+            }
+          <BLANKLINE>
+            __forget_imports__ = [
+              'from xx import yy',
+              'from xx import zz',
+            ]
+          ''')
+
+        :rtype:
+          `ImportDB`
+        """
+        if not isinstance(blocks, (tuple, list)):
+            blocks = [blocks]
+        if not isinstance(_mandatory_imports_blocks_deprecated, (tuple, list)):
+            _mandatory_imports_blocks_deprecated = [_mandatory_imports_blocks_deprecated]
+        if not isinstance(_forget_imports_blocks_deprecated, (tuple, list)):
+            _forget_imports_blocks_deprecated = [_forget_imports_blocks_deprecated]
+        known_imports     = []
+        mandatory_imports = []
+        canonical_imports = []
+        forget_imports    = []
+        blocks = [PythonBlock(b) for b in blocks]
+        for block in blocks:
+            for statement in block.statements:
+                if statement.is_comment_or_blank:
+                    continue
+                if statement.is_import:
+                    known_imports.extend(ImportStatement(statement).imports)
+                    continue
+                try:
+                    name, value = statement.get_assignment_literal_value()
+                    if name == "__mandatory_imports__":
+                        mandatory_imports.append(cls._parse_import_set(value))
+                    elif name == "__canonical_imports__":
+                        canonical_imports.append(cls._parse_import_map(value))
+                    elif name == "__forget_imports__":
+                        forget_imports.append(cls._parse_import_set(value))
+                    else:
+                        raise ValueError(
+                            "Unknown assignment to %r (expected one of "
+                            "__mandatory_imports__, __canonical_imports__, "
+                            "__forget_imports__)" % (name,))
+                except ValueError as e:
+                    raise ValueError(
+                        "While parsing %s: error in %r: %s"
+                        % (block.filename, statement, e))
+        for block in _mandatory_imports_blocks_deprecated:
+            mandatory_imports.append(ImportSet(block))
+        for block in _forget_imports_blocks_deprecated:
+            forget_imports.append(ImportSet(block))
+        return cls._from_data(known_imports,
+                              mandatory_imports,
+                              canonical_imports,
+                              forget_imports)
+
+    @classmethod
+    def _from_filenames(cls, filenames, _mandatory_filenames_deprecated=[]):
+        """
+        Load an import database from filenames.
+
+        This function exists to support deprecated behavior.
+        When we stop supporting the old behavior, we will delete this function.
+
+        :type filenames:
+          Sequence of `Filename` s
+        :param filenames:
+          Filenames of files to read.
+        :rtype:
+          `ImportDB`
+        """
+        if not isinstance(filenames, (tuple, list)):
+            filenames = [filenames]
+        filenames = [Filename(f) for f in filenames]
+        logger.debug("ImportDB: loading [%s], mandatory=[%s]",
+                     ', '.join(map(str, filenames)),
+                     ', '.join(map(str, _mandatory_filenames_deprecated)))
+        if "SUPPORT DEPRECATED BEHAVIOR":
+            # Before 2014-10, pyflyby read the following:
+            #   * known_imports from $PYFLYBY_PATH/known_imports/**/*.py or
+            #     $PYFLYBY_KNOWN_IMPORTS_PATH/**/*.py,
+            #   * mandatory_imports from $PYFLYBY_PATH/mandatory_imports/**/*.py or
+            #     $PYFLYBY_MANDATORY_IMPORTS_PATH/**/*.py, and
+            #   * forget_imports from $PYFLYBY_PATH/known_imports/**/__remove__.py
+            # After 2014-10, pyflyby reads the following:
+            #   * $PYFLYBY_PATH/**/*.py
+            #     (with directives inside the file)
+            # For backwards compatibility, for now we continue supporting the
+            # old, deprecated behavior.
+            blocks = []
+            mandatory_imports_blocks = [
+                Filename(f) for f in _mandatory_filenames_deprecated]
+            forget_imports_blocks = []
+            for filename in filenames:
+                if filename.base == "__remove__.py":
+                    forget_imports_blocks.append(filename)
+                elif "mandatory_imports" in str(filename).split("/"):
+                    mandatory_imports_blocks.append(filename)
+                else:
+                    blocks.append(filename)
+            return cls._from_code(
+                blocks, mandatory_imports_blocks, forget_imports_blocks)
+        else:
+            return cls._from_code(filenames)
+
+    @classmethod
+    def _parse_import_set(cls, arg):
+        if isinstance(arg, six.string_types):
+            arg = [arg]
+        if not isinstance(arg, (tuple, list)):
+            raise ValueError("Expected a list, not a %s" % (type(arg).__name__,))
+        for item in arg:
+            if not isinstance(item, six.string_types):
+                raise ValueError(
+                    "Expected a list of str, not %s" % (type(item).__name__,))
+        return ImportSet(arg)
+
+    @classmethod
+    def _parse_import_map(cls, arg):
+        if isinstance(arg, six.string_types):
+            arg = [arg]
+        if not isinstance(arg, dict):
+            raise ValueError("Expected a dict, not a %s" % (type(arg).__name__,))
+        for k, v in arg.items():
+            if not isinstance(k, six.string_types):
+                raise ValueError(
+                    "Expected a dict of str, not %s" % (type(k).__name__,))
+            if not isinstance(v, six.string_types):
+                raise ValueError(
+                    "Expected a dict of str, not %s" % (type(v).__name__,))
+        return ImportMap(arg)
+
+    @cached_attribute
+    def by_fullname_or_import_as(self):
+        """
+        Map from ``fullname`` and ``import_as`` to `Import` s.
+
+          >>> import pprint
+          >>> db = ImportDB('from aa.bb import cc as dd')
+          >>> pprint.pprint(db.by_fullname_or_import_as)
+          {'aa': (Import('import aa'),),
+           'aa.bb': (Import('import aa.bb'),),
+           'dd': (Import('from aa.bb import cc as dd'),)}
+
+        :rtype:
+          ``dict`` mapping from ``str`` to tuple of `Import` s
+        """
+        # TODO: make known_imports take into account the below forget_imports,
+        # then move this function into ImportSet
+        d = defaultdict(set)
+        for imp in self.known_imports.imports:
+            # Given an import like "from foo.bar import quux as QUUX", add the
+            # following entries:
+            #   - "QUUX"         => "from foo.bar import quux as QUUX"
+            #   - "foo.bar"      => "import foo.bar"
+            #   - "foo"          => "import foo"
+            # We don't include an entry labeled "quux" because the user has
+            # implied he doesn't want to pollute the global namespace with
+            # "quux", only "QUUX".
+            d[imp.import_as].add(imp)
+            for prefix in dotted_prefixes(imp.fullname)[:-1]:
+                d[prefix].add(Import.from_parts(prefix, prefix))
+        return dict( (k, tuple(sorted(v - set(self.forget_imports.imports))))
+                     for k, v in six.iteritems(d))
+
+    def __repr__(self):
+        printed = self.pretty_print()
+        lines = "".join("  "+line for line in printed.splitlines(True))
+        return "%s('''\n%s''')" % (type(self).__name__, lines)
+
+    def pretty_print(self):
+        s = self.known_imports.pretty_print()
+        if self.mandatory_imports:
+            s += "\n__mandatory_imports__ = [\n"
+            for imp in self.mandatory_imports.imports:
+                s += "  '%s',\n" % imp
+            s += "]\n"
+        if self.canonical_imports:
+            s += "\n__canonical_imports__ = {\n"
+            for k, v in sorted(self.canonical_imports.items()):
+                s += "  '%s': '%s',\n" % (k, v)
+            s += "}\n"
+        if self.forget_imports:
+            s += "\n__forget_imports__ = [\n"
+            for imp in self.forget_imports.imports:
+                s += "  '%s',\n" % imp
+            s += "]\n"
+        return s