# client-py/venv/lib/python3.12/site-packages/pylsp/workspace.py

# Copyright 2017-2020 Palantir Technologies, Inc.
# Copyright 2021- Python Language Server Contributors.

import functools
import io
import logging
import os
import re
import uuid
from collections.abc import Generator
from contextlib import contextmanager
from threading import RLock
from typing import Callable, Optional

import jedi

from . import _utils, lsp, uris

log = logging.getLogger(__name__)

DEFAULT_AUTO_IMPORT_MODULES = ["numpy"]

# TODO: this is not the best e.g. we capture numbers
RE_START_WORD = re.compile("[A-Za-z_0-9]*$")
RE_END_WORD = re.compile("^[A-Za-z_0-9]*")


def lock(method):
    """Decorate ``method`` so its body runs while ``self._lock`` is held.

    The owning instance must expose a ``_lock`` attribute usable as a context
    manager. The wrapper forwards all arguments unchanged and returns whatever
    ``method`` returns; ``functools.wraps`` keeps the wrapped metadata.
    """

    def guarded(self, *args, **kwargs):
        guard = self._lock
        with guard:
            return method(self, *args, **kwargs)

    return functools.wraps(method)(guarded)


class Workspace:
    """Track the documents of one workspace root and talk to the client.

    A workspace owns the mapping from document URI to document objects
    (``Document``, ``Notebook`` or ``Cell``), a cache of jedi environments
    used by its documents, lazily created rope objects, and the endpoint used
    to send notifications and requests to the client.
    """

    # LSP method names used for outgoing notifications and requests.
    M_PUBLISH_DIAGNOSTICS = "textDocument/publishDiagnostics"
    M_PROGRESS = "$/progress"
    M_INITIALIZE_PROGRESS = "window/workDoneProgress/create"
    M_APPLY_EDIT = "workspace/applyEdit"
    M_SHOW_MESSAGE = "window/showMessage"
    M_LOG_MESSAGE = "window/logMessage"

    def __init__(self, root_uri, endpoint, config=None) -> None:
        """Create a workspace rooted at ``root_uri``.

        Parameters
        ----------
        root_uri:
            URI of the workspace root; its scheme and filesystem path are
            derived once here.
        endpoint:
            Object whose ``notify`` / ``request`` methods reach the client.
        config:
            Optional configuration object, shared with every document the
            workspace creates.
        """
        self._config = config
        self._root_uri = root_uri
        self._endpoint = endpoint
        self._root_uri_scheme = uris.urlparse(self._root_uri)[0]
        self._root_path = uris.to_fs_path(self._root_uri)
        self._docs = {}

        # Cache jedi environments
        self._environments = {}

        # Whilst incubating, keep rope private
        self.__rope = None
        self.__rope_config = None
        self.__rope_autoimport = None

    def _rope_autoimport(
        self,
        rope_config: Optional,
        memory: bool = False,
    ):
        """Return the workspace's rope ``AutoImport``, creating it on first use.

        ``rope_config`` and ``memory`` only matter for the first call; later
        calls return the cached instance unchanged.
        """
        # Imported lazily so rope is only loaded when it is actually needed.
        from rope.contrib.autoimport.sqlite import AutoImport

        if self.__rope_autoimport is None:
            project = self._rope_project_builder(rope_config)
            self.__rope_autoimport = AutoImport(project, memory=memory)
        return self.__rope_autoimport

    def _rope_project_builder(self, rope_config):
        """Return a validated rope ``Project`` for this workspace root.

        The project is (re)built when none exists yet or when ``rope_config``
        differs from the settings the cached project was built with;
        otherwise the cached project is reused. ``validate()`` is called on
        every invocation.
        """
        # Imported lazily so rope is only loaded when it is actually needed.
        from rope.base.project import Project

        # TODO: we could keep track of dirty files and validate only those
        if self.__rope is None or self.__rope_config != rope_config:
            rope_folder = rope_config.get("ropeFolder")
            if "ropeFolder" in rope_config:
                self.__rope = Project(self._root_path, ropefolder=rope_folder)
            else:
                self.__rope = Project(self._root_path)
            self.__rope.prefs.set(
                "extension_modules", rope_config.get("extensionModules", [])
            )
            self.__rope.prefs.set("ignore_syntax_errors", True)
            self.__rope.prefs.set("ignore_bad_imports", True)
            # Remember a snapshot of the settings used for this project.
            # Without it the comparison above is always true and a brand new
            # Project is created on every call. A copy is stored so in-place
            # edits of the caller's mapping are still detected.
            self.__rope_config = dict(rope_config)
        self.__rope.validate()
        return self.__rope

    @property
    def documents(self):
        """The live mapping of document URI to document object."""
        return self._docs

    @property
    def root_path(self):
        """Filesystem path derived from the workspace root URI."""
        return self._root_path

    @property
    def root_uri(self):
        """The workspace root URI as given to the constructor."""
        return self._root_uri

    def is_local(self):
        """Return True if the root URI scheme is empty or ``file`` and the root path exists."""
        return (self._root_uri_scheme in ["", "file"]) and os.path.exists(
            self._root_path
        )

    def get_document(self, doc_uri):
        """Return a managed document if-present, else create one pointing at disk.

        A document created here is not stored in the workspace.

        See https://github.com/Microsoft/language-server-protocol/issues/177
        """
        return self._docs.get(doc_uri) or self._create_document(doc_uri)

    def get_cell_document(self, doc_uri):
        """Return the stored document for ``doc_uri``, or None if there is none."""
        return self._docs.get(doc_uri)

    def get_maybe_document(self, doc_uri):
        """Return the stored document for ``doc_uri``, or None if there is none."""
        return self._docs.get(doc_uri)

    def put_document(self, doc_uri, source, version=None) -> None:
        """Create a ``Document`` for ``doc_uri`` and store it, replacing any previous entry."""
        self._docs[doc_uri] = self._create_document(
            doc_uri, source=source, version=version
        )

    def put_notebook_document(
        self, doc_uri, notebook_type, cells, version=None, metadata=None
    ) -> None:
        """Create a ``Notebook`` for ``doc_uri`` and store it, replacing any previous entry."""
        self._docs[doc_uri] = self._create_notebook_document(
            doc_uri, notebook_type, cells, version, metadata
        )

    @contextmanager
    def temp_document(self, source, path=None) -> Generator[str, None, None]:
        """Register a throw-away document and yield its URI.

        The document gets a random (uuid4) file name under ``path`` (the
        workspace root when ``path`` is None) and is removed from the
        workspace again when the ``with`` block exits.
        """
        if path is None:
            path = self.root_path
        uri = uris.from_fs_path(os.path.join(path, str(uuid.uuid4())))
        # Register before entering the try block: if registration itself
        # fails there is nothing to remove, and the cleanup must not mask the
        # original error with a KeyError.
        self.put_document(uri, source)
        try:
            yield uri
        finally:
            self.rm_document(uri)

    def add_notebook_cells(self, doc_uri, cells, start) -> None:
        """Insert ``cells`` at index ``start`` of the stored notebook ``doc_uri``."""
        self._docs[doc_uri].add_cells(cells, start)

    def remove_notebook_cells(self, doc_uri, start, delete_count) -> None:
        """Remove ``delete_count`` cells starting at ``start`` from the stored notebook."""
        self._docs[doc_uri].remove_cells(start, delete_count)

    def update_notebook_metadata(self, doc_uri, metadata) -> None:
        """Replace the metadata of the stored notebook ``doc_uri``."""
        self._docs[doc_uri].metadata = metadata

    def put_cell_document(
        self, doc_uri, notebook_uri, language_id, source, version=None
    ) -> None:
        """Create a ``Cell`` for ``doc_uri`` and store it, replacing any previous entry."""
        self._docs[doc_uri] = self._create_cell_document(
            doc_uri, notebook_uri, language_id, source, version
        )

    def rm_document(self, doc_uri) -> None:
        """Remove ``doc_uri`` from the workspace; raises ``KeyError`` if it is not stored."""
        self._docs.pop(doc_uri)

    def update_document(self, doc_uri, change, version=None) -> None:
        """Apply ``change`` to the stored document and record its new ``version``."""
        self._docs[doc_uri].apply_change(change)
        self._docs[doc_uri].version = version

    def update_config(self, settings):
        """Merge the ``pylsp`` section of ``settings`` into the workspace and document configs."""
        self._config.update((settings or {}).get("pylsp", {}))
        for doc_uri in self.documents:
            if isinstance(document := self.get_document(doc_uri), Notebook):
                # Notebook documents don't have a config. The config is
                # handled at the cell level. Skip this entry only: returning
                # here would leave every later document un-updated.
                continue
            document.update_config(settings)

    def apply_edit(self, edit):
        """Send a ``workspace/applyEdit`` request and return the endpoint's result."""
        return self._endpoint.request(self.M_APPLY_EDIT, {"edit": edit})

    def publish_diagnostics(self, doc_uri, diagnostics, doc_version=None) -> None:
        """Notify the client of ``diagnostics`` for ``doc_uri``.

        ``version`` is included whenever ``doc_version`` is not None, so a
        document version of ``0`` is reported as well.
        """
        params = {
            "uri": doc_uri,
            "diagnostics": diagnostics,
        }

        if doc_version is not None:
            params["version"] = doc_version

        self._endpoint.notify(
            self.M_PUBLISH_DIAGNOSTICS,
            params=params,
        )

    @contextmanager
    def report_progress(
        self,
        title: str,
        message: Optional[str] = None,
        percentage: Optional[int] = None,
        skip_token_initialization: bool = False,
    ) -> Generator[Callable[[str, Optional[int]], None], None, None]:
        """
        Report progress to the editor / client.

        Yields a callable ``(message, percentage=None)`` that sends a progress
        report. When the configured client capabilities do not include
        ``window.workDoneProgress`` (or there is no config), the yielded
        callable does nothing.

        ``skip_token_initialization`` is necessary due to some current
        limitations of our LSP implementation. When ``report_progress``
        is used from a synchronous LSP handler, the token initialization
        will time out because we can't receive the response.

        Many editors will still correctly show the progress messages though, which
        is why we are giving progress users the option to skip the initialization
        of the progress token.
        """
        if self._config:
            client_supports_progress_reporting = self._config.capabilities.get(
                "window", {}
            ).get("workDoneProgress", False)
        else:
            client_supports_progress_reporting = False

        if client_supports_progress_reporting:
            token = self._progress_begin(
                title, message, percentage, skip_token_initialization
            )

            def progress_message(
                message: str, percentage: Optional[int] = None
            ) -> None:
                self._progress_report(token, message, percentage)

            try:
                yield progress_message
            finally:
                # Always close the progress, even if the caller's block raised.
                self._progress_end(token)

            return

        # FALLBACK:
        # If the client doesn't support progress reporting, we have a dummy method
        # for the caller to use.
        def dummy_progress_message(
            message: str, percentage: Optional[int] = None
        ) -> None:
            pass

        yield dummy_progress_message

    def _progress_begin(
        self,
        title: str,
        message: Optional[str] = None,
        percentage: Optional[int] = None,
        skip_token_initialization: bool = False,
    ) -> str:
        """Start a progress sequence and return its freshly generated token.

        Unless ``skip_token_initialization`` is set, the token is first
        announced with a ``window/workDoneProgress/create`` request, waiting
        at most one second for the result; a failure there is logged and
        otherwise ignored. A ``begin`` notification is sent in every case.
        """
        token = str(uuid.uuid4())

        if not skip_token_initialization:
            try:
                self._endpoint.request(
                    self.M_INITIALIZE_PROGRESS, {"token": token}
                ).result(timeout=1.0)
            except Exception:
                # Deliberately best-effort: progress must never break the
                # operation that is being reported on.
                log.warning(
                    "There was an error while trying to initialize progress reporting. "
                    "Likely progress reporting was used in a synchronous LSP handler, "
                    "which is not supported by progress reporting yet. "
                    "To prevent waiting for the timeout you can set "
                    "`skip_token_initialization=True`. "
                    "Not every editor will show progress then, but many will.",
                    exc_info=True,
                )

        value = {
            "kind": "begin",
            "title": title,
        }
        if message is not None:
            value["message"] = message
        if percentage is not None:
            value["percentage"] = percentage

        self._endpoint.notify(
            self.M_PROGRESS,
            params={
                "token": token,
                "value": value,
            },
        )
        return token

    def _progress_report(
        self,
        token: str,
        message: Optional[str] = None,
        percentage: Optional[int] = None,
    ) -> None:
        """Send a ``report`` notification for ``token``.

        ``message`` is included when non-empty; ``percentage`` is included
        whenever it is not None, so an explicit ``0`` is reported (matching
        ``_progress_begin``).
        """
        value = {
            "kind": "report",
        }
        if message:
            value["message"] = message
        if percentage is not None:
            value["percentage"] = percentage

        self._endpoint.notify(
            self.M_PROGRESS,
            params={
                "token": token,
                "value": value,
            },
        )

    def _progress_end(self, token: str, message: Optional[str] = None) -> None:
        """Send the ``end`` notification for ``token``, with ``message`` if non-empty."""
        value = {
            "kind": "end",
        }
        if message:
            value["message"] = message

        self._endpoint.notify(
            self.M_PROGRESS,
            params={
                "token": token,
                "value": value,
            },
        )

    def log_message(self, message, msg_type=lsp.MessageType.Info) -> None:
        """Send a ``window/logMessage`` notification to the client."""
        self._endpoint.notify(
            self.M_LOG_MESSAGE, params={"type": msg_type, "message": message}
        )

    def show_message(self, message, msg_type=lsp.MessageType.Info) -> None:
        """Send a ``window/showMessage`` notification to the client."""
        self._endpoint.notify(
            self.M_SHOW_MESSAGE, params={"type": msg_type, "message": message}
        )

    def source_roots(self, document_path):
        """Return the source roots for the given document.

        These are the de-duplicated directories of every ``setup.py`` /
        ``pyproject.toml`` reported by ``_utils.find_parents`` for
        ``document_path``; when none is reported, the workspace root path is
        the only entry.
        """
        files = (
            _utils.find_parents(
                self._root_path, document_path, ["setup.py", "pyproject.toml"]
            )
            or []
        )
        return list({os.path.dirname(project_file) for project_file in files}) or [
            self._root_path
        ]

    def _create_document(self, doc_uri, source=None, version=None):
        """Build (without storing) a ``Document`` bound to this workspace."""
        path = uris.to_fs_path(doc_uri)
        return Document(
            doc_uri,
            self,
            source=source,
            version=version,
            extra_sys_path=self.source_roots(path),
            rope_project_builder=self._rope_project_builder,
        )

    def _create_notebook_document(
        self, doc_uri, notebook_type, cells, version=None, metadata=None
    ):
        """Build (without storing) a ``Notebook`` bound to this workspace."""
        return Notebook(
            doc_uri,
            notebook_type,
            self,
            cells=cells,
            version=version,
            metadata=metadata,
        )

    def _create_cell_document(
        self, doc_uri, notebook_uri, language_id, source=None, version=None
    ):
        """Build (without storing) a ``Cell`` bound to this workspace."""
        # TODO: remove what is unnecessary here.
        path = uris.to_fs_path(doc_uri)
        return Cell(
            doc_uri,
            notebook_uri=notebook_uri,
            language_id=language_id,
            workspace=self,
            source=source,
            version=version,
            extra_sys_path=self.source_roots(path),
            rope_project_builder=self._rope_project_builder,
        )

    def close(self) -> None:
        """Close the rope ``AutoImport`` instance if one was created."""
        if self.__rope_autoimport:
            self.__rope_autoimport.close()


class Document:
    """A text document of a workspace, held in memory or read from disk.

    While ``source`` was never supplied (and no change has been applied) the
    text is read from ``path`` on every access. Methods decorated with
    ``lock`` run while the document's re-entrant lock is held.
    """

    def __init__(
        self,
        uri,
        workspace,
        source=None,
        version=None,
        local=True,
        extra_sys_path=None,
        rope_project_builder=None,
    ) -> None:
        """Create a document for ``uri`` that belongs to ``workspace``.

        Parameters
        ----------
        uri:
            Document URI; the filesystem path, dotted name and file name are
            derived from it.
        workspace:
            Owning workspace; its ``_config`` object is shared with this
            document.
        source:
            Initial text, or None to read the file from disk on demand.
        version:
            Document version as reported by the client.
        local:
            Stored as ``_local``; not used elsewhere in this class.
        extra_sys_path:
            Paths placed in front of the environment's ``sys.path``.
        rope_project_builder:
            Callable taking a rope config and returning a rope project.
        """
        self.uri = uri
        self.version = version
        self.path = uris.to_fs_path(uri)
        self.dot_path = _utils.path_to_dot_name(self.path)
        self.filename = os.path.basename(self.path)
        self.shared_data = {}

        self._config = workspace._config
        self._workspace = workspace
        self._local = local
        self._source = source
        self._extra_sys_path = extra_sys_path or []
        self._rope_project_builder = rope_project_builder
        self._lock = RLock()

    def __str__(self):
        return str(self.uri)

    def _rope_resource(self, rope_config):
        """Return the rope resource for this document's path in the rope project."""
        # Imported lazily so rope is only loaded when it is actually needed.
        from rope.base import libutils

        return libutils.path_to_resource(
            self._rope_project_builder(rope_config), self.path
        )

    @property
    @lock
    def lines(self):
        """The document text split into lines, line endings kept."""
        return self.source.splitlines(True)

    @property
    @lock
    def source(self):
        """The document text.

        Falls back to reading ``path`` as UTF-8 when no in-memory text is
        held; the text read from disk is not cached.
        """
        if self._source is None:
            with open(self.path, encoding="utf-8") as f:
                return f.read()
        return self._source

    def update_config(self, settings) -> None:
        """Merge the ``pylsp`` section of ``settings`` into the document's config."""
        self._config.update((settings or {}).get("pylsp", {}))

    @lock
    def apply_change(self, change):
        """Apply a change to the document.

        ``change`` carries the replacement ``text`` and optionally a
        ``range`` with ``start`` / ``end`` positions (``line`` and
        ``character``). Without a range the whole text is replaced. An edit
        that starts at or beyond the end of the document appends ``text``.
        """
        text = change["text"]
        change_range = change.get("range")

        if not change_range:
            # The whole file has changed
            self._source = text
            return

        start_line = change_range["start"]["line"]
        start_col = change_range["start"]["character"]
        end_line = change_range["end"]["line"]
        end_col = change_range["end"]["character"]

        # Check for an edit occurring at (or past) the very end of the file.
        # Using ">=" rather than "==" matters: with a start line beyond the
        # last line the loop below would never reach the edit range and the
        # new text would be dropped silently.
        lines = self.lines
        if start_line >= len(lines):
            self._source = self.source + text
            return

        new = io.StringIO()

        # Iterate over the existing document until we hit the edit range,
        # at which point we write the new text, then loop until we hit
        # the end of the range and continue writing.
        for i, line in enumerate(lines):
            if i < start_line:
                new.write(line)
                continue

            if i > end_line:
                new.write(line)
                continue

            if i == start_line:
                new.write(line[:start_col])
                new.write(text)

            if i == end_line:
                new.write(line[end_col:])

        self._source = new.getvalue()

    def offset_at_position(self, position):
        """Return the character offset into the source for the given position.

        The offset is the combined length of all lines before
        ``position["line"]`` plus ``position["character"]``.
        """
        return position["character"] + len("".join(self.lines[: position["line"]]))

    def word_at_position(self, position):
        """Return the word under the cursor as a string.

        The word is the run of ``[A-Za-z_0-9]`` characters touching the
        cursor on either side. An empty string is returned when there is no
        such run or when the line index is past the end of the document.
        """
        lines = self.lines
        if position["line"] >= len(lines):
            return ""

        line = lines[position["line"]]
        i = position["character"]
        # Split word in two
        start = line[:i]
        end = line[i:]

        # Take end of start and start of end to find word
        # These are guaranteed to match, even if they match the empty string
        m_start = RE_START_WORD.findall(start)
        m_end = RE_END_WORD.findall(end)

        return m_start[0] + m_end[-1]

    @lock
    def jedi_names(self, all_scopes=False, definitions=True, references=False):
        """Return ``get_names(...)`` of a jedi script built for this document."""
        script = self.jedi_script()
        return script.get_names(
            all_scopes=all_scopes, definitions=definitions, references=references
        )

    @lock
    def jedi_script(self, position=None, use_document_path=False):
        """Build a ``jedi.Script`` for the current text of this document.

        When a config is present, the ``jedi`` plugin settings supply the
        environment path, extra paths, environment variables and the
        auto-import module list. Note that the latter is written to the
        process-wide ``jedi.settings.auto_import_modules``.

        Parameters
        ----------
        position:
            Optional position; when given, the result of
            ``_utils.position_to_jedi_linecolumn`` is merged into the
            ``jedi.Script`` keyword arguments.
        use_document_path:
            When true, the document's directory is appended to the project's
            ``sys_path``.
        """
        extra_paths = []
        environment_path = None
        env_vars = None
        prioritize_extra_paths = False

        if self._config:
            jedi_settings = self._config.plugin_settings(
                "jedi", document_path=self.path
            )
            jedi.settings.auto_import_modules = jedi_settings.get(
                "auto_import_modules", DEFAULT_AUTO_IMPORT_MODULES
            )
            environment_path = jedi_settings.get("environment")
            # Jedi itself cannot deal with homedir-relative paths.
            # On systems, where it is expected, expand the home directory.
            if environment_path and os.name != "nt":
                environment_path = os.path.expanduser(environment_path)

            extra_paths = jedi_settings.get("extra_paths") or []
            env_vars = jedi_settings.get("env_vars")
            prioritize_extra_paths = jedi_settings.get("prioritize_extra_paths")

        # Drop PYTHONPATH from env_vars before creating the environment to
        # ensure that Jedi can startup properly without module name collision.
        # Always work on a private copy so the mapping stored in the settings
        # is not modified as a side effect.
        env_vars = dict(os.environ if env_vars is None else env_vars)
        env_vars.pop("PYTHONPATH", None)

        environment = self.get_enviroment(environment_path, env_vars=env_vars)
        sys_path = self.sys_path(
            environment_path, env_vars, prioritize_extra_paths, extra_paths
        )

        project_path = self._workspace.root_path

        # Extend sys_path with document's path if requested
        if use_document_path:
            sys_path += [os.path.normpath(os.path.dirname(self.path))]

        kwargs = {
            "code": self.source,
            "path": self.path,
            "environment": environment if environment_path else None,
            "project": jedi.Project(path=project_path, sys_path=sys_path),
        }

        if position:
            # Deprecated by Jedi to use in Script() constructor
            # ``kwargs`` is a dict, so the entries have to be merged with
            # update(); ``+=`` is not defined for dicts and raises TypeError.
            # NOTE(review): confirm the installed Jedi version still accepts
            # position keywords in Script().
            kwargs.update(_utils.position_to_jedi_linecolumn(self, position))

        return jedi.Script(**kwargs)

    def get_enviroment(self, environment_path=None, env_vars=None):
        """Return the jedi environment for ``environment_path``.

        Without a path, jedi's cached default environment is returned.
        Otherwise the environment is created once and cached on the
        workspace, keyed by path; ``env_vars`` is only used when creating it.
        """
        # TODO(gatesn): #339 - make better use of jedi environments, they seem pretty powerful
        if environment_path is None:
            environment = jedi.api.environment.get_cached_default_environment()
        else:
            if environment_path in self._workspace._environments:
                environment = self._workspace._environments[environment_path]
            else:
                environment = jedi.api.environment.create_environment(
                    path=environment_path, safe=False, env_vars=env_vars
                )
                self._workspace._environments[environment_path] = environment

        return environment

    def sys_path(
        self,
        environment_path=None,
        env_vars=None,
        prioritize_extra_paths=False,
        extra_paths=None,
    ):
        """Return a new list with the import search path for this document.

        The base is the document's extra sys path followed by the
        environment's ``sys.path``. ``extra_paths`` goes in front of the base
        when ``prioritize_extra_paths`` is true, otherwise after it.
        """
        # None replaces the former mutable ``[]`` default; the copy also
        # makes sure the caller's sequence is never aliased by the result.
        extra_paths = list(extra_paths or [])

        # Copy our extra sys path
        path = list(self._extra_sys_path)
        environment = self.get_enviroment(
            environment_path=environment_path, env_vars=env_vars
        )
        path.extend(environment.get_sys_path())
        if prioritize_extra_paths:
            path = extra_paths + path
        else:
            path = path + extra_paths

        return path


class Notebook:
    """A notebook document: an ordered list of cell descriptors plus metadata."""

    def __init__(
        self, uri, notebook_type, workspace, cells=None, version=None, metadata=None
    ) -> None:
        """Store the notebook attributes; missing cells / metadata become empty."""
        self._lock = RLock()
        self.workspace = workspace
        self.uri = uri
        self.notebook_type = notebook_type
        self.version = version
        self.metadata = metadata or {}
        self.cells = cells or []

    def __str__(self):
        return f"Notebook with URI '{self.uri!s}'"

    def add_cells(self, new_cells: list, start: int) -> None:
        """Insert ``new_cells`` into the cell list at index ``start``."""
        insertion_point = slice(start, start)
        self.cells[insertion_point] = new_cells

    def remove_cells(self, start: int, delete_count: int) -> None:
        """Delete ``delete_count`` cells beginning at index ``start``."""
        stop = start + delete_count
        del self.cells[start:stop]

    def cell_data(self):
        """Collect line ranges and source for every cell.

        Returns a dict keyed by cell uri, in cell order. Each value holds
        ``line_start`` and ``line_end`` (line indices counted across all
        preceding cells) and the cell's ``source``.
        """
        collected = {}
        first_line = 0
        for entry in self.cells:
            uri = entry["document"]
            document = self.workspace.get_cell_document(uri)
            line_total = document.line_count
            last_line = first_line + line_total - 1
            collected[uri] = {
                "line_start": first_line,
                "line_end": last_line,
                "source": document.source,
            }
            first_line += line_total
        return collected

    @lock
    def jedi_names(
        self,
        up_to_cell_uri: Optional[str] = None,
        all_scopes=False,
        definitions=True,
        references=False,
    ):
        """
        Return the set of name strings found in the notebook's cells.

        Parameters
        ----------
        up_to_cell_uri: str, optional
            Uri of the last cell to include. If None, every cell is included.
        """
        found = set()
        for entry in self.cells:
            uri = entry["document"]
            document = self.workspace.get_cell_document(uri)
            cell_names = document.jedi_names(all_scopes, definitions, references)
            found.update(item.name for item in cell_names)
            if uri == up_to_cell_uri:
                # The requested cell itself is included before stopping.
                break
        return found


class Cell(Document):
    """
    A single cell of a notebook.

    Notes
    -----
    For now this derives from Document so that cells expose the same API as
    text documents. Unlike a text document, a cell also carries a language id
    and the uri of the notebook it belongs to.
    """

    def __init__(
        self,
        uri,
        notebook_uri,
        language_id,
        workspace,
        source=None,
        version=None,
        local=True,
        extra_sys_path=None,
        rope_project_builder=None,
    ) -> None:
        """Initialise the underlying document, then record the cell-only fields."""
        super().__init__(
            uri,
            workspace,
            source=source,
            version=version,
            local=local,
            extra_sys_path=extra_sys_path,
            rope_project_builder=rope_project_builder,
        )
        self.language_id = language_id
        self.notebook_uri = notebook_uri

    @property
    @lock
    def line_count(self):
        """Return the number of lines in the cell document.

        Lines are separated by ``"\\n"`` only, so an empty source counts as
        one line.
        """
        newline_total = self.source.count("\n")
        return newline_total + 1