client-py/venv/lib/python3.12/site-packages/pylsp/workspace.py
2026-05-02 13:34:53 +05:00

713 lines
22 KiB
Python

# Copyright 2017-2020 Palantir Technologies, Inc.
# Copyright 2021- Python Language Server Contributors.
import functools
import io
import logging
import os
import re
import uuid
from collections.abc import Generator
from contextlib import contextmanager
from threading import RLock
from typing import Callable, Optional
import jedi
from . import _utils, lsp, uris
log = logging.getLogger(__name__)
DEFAULT_AUTO_IMPORT_MODULES = ["numpy"]
# TODO: this is not the best e.g. we capture numbers
RE_START_WORD = re.compile("[A-Za-z_0-9]*$")
RE_END_WORD = re.compile("^[A-Za-z_0-9]*")
def lock(method):
"""Define an atomic region over a method."""
@functools.wraps(method)
def wrapper(self, *args, **kwargs):
with self._lock:
return method(self, *args, **kwargs)
return wrapper
class Workspace:
M_PUBLISH_DIAGNOSTICS = "textDocument/publishDiagnostics"
M_PROGRESS = "$/progress"
M_INITIALIZE_PROGRESS = "window/workDoneProgress/create"
M_APPLY_EDIT = "workspace/applyEdit"
M_SHOW_MESSAGE = "window/showMessage"
M_LOG_MESSAGE = "window/logMessage"
def __init__(self, root_uri, endpoint, config=None) -> None:
self._config = config
self._root_uri = root_uri
self._endpoint = endpoint
self._root_uri_scheme = uris.urlparse(self._root_uri)[0]
self._root_path = uris.to_fs_path(self._root_uri)
self._docs = {}
# Cache jedi environments
self._environments = {}
# Whilst incubating, keep rope private
self.__rope = None
self.__rope_config = None
self.__rope_autoimport = None
def _rope_autoimport(
self,
rope_config: Optional,
memory: bool = False,
):
from rope.contrib.autoimport.sqlite import AutoImport
if self.__rope_autoimport is None:
project = self._rope_project_builder(rope_config)
self.__rope_autoimport = AutoImport(project, memory=memory)
return self.__rope_autoimport
def _rope_project_builder(self, rope_config):
from rope.base.project import Project
# TODO: we could keep track of dirty files and validate only those
if self.__rope is None or self.__rope_config != rope_config:
rope_folder = rope_config.get("ropeFolder")
if "ropeFolder" in rope_config:
self.__rope = Project(self._root_path, ropefolder=rope_folder)
else:
self.__rope = Project(self._root_path)
self.__rope.prefs.set(
"extension_modules", rope_config.get("extensionModules", [])
)
self.__rope.prefs.set("ignore_syntax_errors", True)
self.__rope.prefs.set("ignore_bad_imports", True)
self.__rope.validate()
return self.__rope
@property
def documents(self):
return self._docs
@property
def root_path(self):
return self._root_path
@property
def root_uri(self):
return self._root_uri
def is_local(self):
return (self._root_uri_scheme in ["", "file"]) and os.path.exists(
self._root_path
)
def get_document(self, doc_uri):
"""Return a managed document if-present, else create one pointing at disk.
See https://github.com/Microsoft/language-server-protocol/issues/177
"""
return self._docs.get(doc_uri) or self._create_document(doc_uri)
def get_cell_document(self, doc_uri):
return self._docs.get(doc_uri)
def get_maybe_document(self, doc_uri):
return self._docs.get(doc_uri)
def put_document(self, doc_uri, source, version=None) -> None:
self._docs[doc_uri] = self._create_document(
doc_uri, source=source, version=version
)
def put_notebook_document(
self, doc_uri, notebook_type, cells, version=None, metadata=None
) -> None:
self._docs[doc_uri] = self._create_notebook_document(
doc_uri, notebook_type, cells, version, metadata
)
@contextmanager
def temp_document(self, source, path=None) -> None:
if path is None:
path = self.root_path
uri = uris.from_fs_path(os.path.join(path, str(uuid.uuid4())))
try:
self.put_document(uri, source)
yield uri
finally:
self.rm_document(uri)
def add_notebook_cells(self, doc_uri, cells, start) -> None:
self._docs[doc_uri].add_cells(cells, start)
def remove_notebook_cells(self, doc_uri, start, delete_count) -> None:
self._docs[doc_uri].remove_cells(start, delete_count)
def update_notebook_metadata(self, doc_uri, metadata) -> None:
self._docs[doc_uri].metadata = metadata
def put_cell_document(
self, doc_uri, notebook_uri, language_id, source, version=None
) -> None:
self._docs[doc_uri] = self._create_cell_document(
doc_uri, notebook_uri, language_id, source, version
)
def rm_document(self, doc_uri) -> None:
self._docs.pop(doc_uri)
def update_document(self, doc_uri, change, version=None) -> None:
self._docs[doc_uri].apply_change(change)
self._docs[doc_uri].version = version
def update_config(self, settings):
self._config.update((settings or {}).get("pylsp", {}))
for doc_uri in self.documents:
if isinstance(document := self.get_document(doc_uri), Notebook):
# Notebook documents don't have a config. The config is
# handled at the cell level.
return
document.update_config(settings)
def apply_edit(self, edit):
return self._endpoint.request(self.M_APPLY_EDIT, {"edit": edit})
def publish_diagnostics(self, doc_uri, diagnostics, doc_version=None) -> None:
params = {
"uri": doc_uri,
"diagnostics": diagnostics,
}
if doc_version:
params["version"] = doc_version
self._endpoint.notify(
self.M_PUBLISH_DIAGNOSTICS,
params=params,
)
@contextmanager
def report_progress(
self,
title: str,
message: Optional[str] = None,
percentage: Optional[int] = None,
skip_token_initialization: bool = False,
) -> Generator[Callable[[str, Optional[int]], None], None, None]:
"""
Report progress to the editor / client.
``skip_token_initialization` is necessary due to some current
limitations of our LSP implementation. When `report_progress`
is used from a synchronous LSP handler, the token initialization
will time out because we can't receive the response.
Many editors will still correctly show the progress messages though, which
is why we are giving progress users the option to skip the initialization
of the progress token.
"""
if self._config:
client_supports_progress_reporting = self._config.capabilities.get(
"window", {}
).get("workDoneProgress", False)
else:
client_supports_progress_reporting = False
if client_supports_progress_reporting:
token = self._progress_begin(
title, message, percentage, skip_token_initialization
)
def progress_message(
message: str, percentage: Optional[int] = None
) -> None:
self._progress_report(token, message, percentage)
try:
yield progress_message
finally:
self._progress_end(token)
return
# FALLBACK:
# If the client doesn't support progress reporting, we have a dummy method
# for the caller to use.
def dummy_progress_message(
message: str, percentage: Optional[int] = None
) -> None:
pass
yield dummy_progress_message
def _progress_begin(
self,
title: str,
message: Optional[str] = None,
percentage: Optional[int] = None,
skip_token_initialization: bool = False,
) -> str:
token = str(uuid.uuid4())
if not skip_token_initialization:
try:
self._endpoint.request(
self.M_INITIALIZE_PROGRESS, {"token": token}
).result(timeout=1.0)
except Exception:
log.warning(
"There was an error while trying to initialize progress reporting."
"Likely progress reporting was used in a synchronous LSP handler, "
"which is not supported by progress reporting yet. "
"To prevent waiting for the timeout you can set "
"`skip_token_initialization=True`. "
"Not every editor will show progress then, but many will.",
exc_info=True,
)
value = {
"kind": "begin",
"title": title,
}
if message is not None:
value["message"] = message
if percentage is not None:
value["percentage"] = percentage
self._endpoint.notify(
self.M_PROGRESS,
params={
"token": token,
"value": value,
},
)
return token
def _progress_report(
self,
token: str,
message: Optional[str] = None,
percentage: Optional[int] = None,
) -> None:
value = {
"kind": "report",
}
if message:
value["message"] = message
if percentage:
value["percentage"] = percentage
self._endpoint.notify(
self.M_PROGRESS,
params={
"token": token,
"value": value,
},
)
def _progress_end(self, token: str, message: Optional[str] = None) -> None:
value = {
"kind": "end",
}
if message:
value["message"] = message
self._endpoint.notify(
self.M_PROGRESS,
params={
"token": token,
"value": value,
},
)
def log_message(self, message, msg_type=lsp.MessageType.Info):
self._endpoint.notify(
self.M_LOG_MESSAGE, params={"type": msg_type, "message": message}
)
def show_message(self, message, msg_type=lsp.MessageType.Info) -> None:
self._endpoint.notify(
self.M_SHOW_MESSAGE, params={"type": msg_type, "message": message}
)
def source_roots(self, document_path):
"""Return the source roots for the given document."""
files = (
_utils.find_parents(
self._root_path, document_path, ["setup.py", "pyproject.toml"]
)
or []
)
return list({os.path.dirname(project_file) for project_file in files}) or [
self._root_path
]
def _create_document(self, doc_uri, source=None, version=None):
path = uris.to_fs_path(doc_uri)
return Document(
doc_uri,
self,
source=source,
version=version,
extra_sys_path=self.source_roots(path),
rope_project_builder=self._rope_project_builder,
)
def _create_notebook_document(
self, doc_uri, notebook_type, cells, version=None, metadata=None
):
return Notebook(
doc_uri,
notebook_type,
self,
cells=cells,
version=version,
metadata=metadata,
)
def _create_cell_document(
self, doc_uri, notebook_uri, language_id, source=None, version=None
):
# TODO: remove what is unnecessary here.
path = uris.to_fs_path(doc_uri)
return Cell(
doc_uri,
notebook_uri=notebook_uri,
language_id=language_id,
workspace=self,
source=source,
version=version,
extra_sys_path=self.source_roots(path),
rope_project_builder=self._rope_project_builder,
)
def close(self) -> None:
if self.__rope_autoimport:
self.__rope_autoimport.close()
class Document:
def __init__(
self,
uri,
workspace,
source=None,
version=None,
local=True,
extra_sys_path=None,
rope_project_builder=None,
) -> None:
self.uri = uri
self.version = version
self.path = uris.to_fs_path(uri)
self.dot_path = _utils.path_to_dot_name(self.path)
self.filename = os.path.basename(self.path)
self.shared_data = {}
self._config = workspace._config
self._workspace = workspace
self._local = local
self._source = source
self._extra_sys_path = extra_sys_path or []
self._rope_project_builder = rope_project_builder
self._lock = RLock()
def __str__(self):
return str(self.uri)
def _rope_resource(self, rope_config):
from rope.base import libutils
return libutils.path_to_resource(
self._rope_project_builder(rope_config), self.path
)
@property
@lock
def lines(self):
return self.source.splitlines(True)
@property
@lock
def source(self):
if self._source is None:
with open(self.path, encoding="utf-8") as f:
return f.read()
return self._source
def update_config(self, settings) -> None:
self._config.update((settings or {}).get("pylsp", {}))
@lock
def apply_change(self, change):
"""Apply a change to the document."""
text = change["text"]
change_range = change.get("range")
if not change_range:
# The whole file has changed
self._source = text
return
start_line = change_range["start"]["line"]
start_col = change_range["start"]["character"]
end_line = change_range["end"]["line"]
end_col = change_range["end"]["character"]
# Check for an edit occuring at the very end of the file
lines = self.lines
if start_line == len(lines):
self._source = self.source + text
return
new = io.StringIO()
# Iterate over the existing document until we hit the edit range,
# at which point we write the new text, then loop until we hit
# the end of the range and continue writing.
for i, line in enumerate(lines):
if i < start_line:
new.write(line)
continue
if i > end_line:
new.write(line)
continue
if i == start_line:
new.write(line[:start_col])
new.write(text)
if i == end_line:
new.write(line[end_col:])
self._source = new.getvalue()
def offset_at_position(self, position):
"""Return the byte-offset pointed at by the given position."""
return position["character"] + len("".join(self.lines[: position["line"]]))
def word_at_position(self, position):
"""Get the word under the cursor returning the start and end positions."""
lines = self.lines
if position["line"] >= len(lines):
return ""
line = lines[position["line"]]
i = position["character"]
# Split word in two
start = line[:i]
end = line[i:]
# Take end of start and start of end to find word
# These are guaranteed to match, even if they match the empty string
m_start = RE_START_WORD.findall(start)
m_end = RE_END_WORD.findall(end)
return m_start[0] + m_end[-1]
@lock
def jedi_names(self, all_scopes=False, definitions=True, references=False):
script = self.jedi_script()
return script.get_names(
all_scopes=all_scopes, definitions=definitions, references=references
)
@lock
def jedi_script(self, position=None, use_document_path=False):
extra_paths = []
environment_path = None
env_vars = None
prioritize_extra_paths = False
if self._config:
jedi_settings = self._config.plugin_settings(
"jedi", document_path=self.path
)
jedi.settings.auto_import_modules = jedi_settings.get(
"auto_import_modules", DEFAULT_AUTO_IMPORT_MODULES
)
environment_path = jedi_settings.get("environment")
# Jedi itself cannot deal with homedir-relative paths.
# On systems, where it is expected, expand the home directory.
if environment_path and os.name != "nt":
environment_path = os.path.expanduser(environment_path)
extra_paths = jedi_settings.get("extra_paths") or []
env_vars = jedi_settings.get("env_vars")
prioritize_extra_paths = jedi_settings.get("prioritize_extra_paths")
# Drop PYTHONPATH from env_vars before creating the environment to
# ensure that Jedi can startup properly without module name collision.
if env_vars is None:
env_vars = os.environ.copy()
env_vars.pop("PYTHONPATH", None)
environment = self.get_enviroment(environment_path, env_vars=env_vars)
sys_path = self.sys_path(
environment_path, env_vars, prioritize_extra_paths, extra_paths
)
project_path = self._workspace.root_path
# Extend sys_path with document's path if requested
if use_document_path:
sys_path += [os.path.normpath(os.path.dirname(self.path))]
kwargs = {
"code": self.source,
"path": self.path,
"environment": environment if environment_path else None,
"project": jedi.Project(path=project_path, sys_path=sys_path),
}
if position:
# Deprecated by Jedi to use in Script() constructor
kwargs += _utils.position_to_jedi_linecolumn(self, position)
return jedi.Script(**kwargs)
def get_enviroment(self, environment_path=None, env_vars=None):
# TODO(gatesn): #339 - make better use of jedi environments, they seem pretty powerful
if environment_path is None:
environment = jedi.api.environment.get_cached_default_environment()
else:
if environment_path in self._workspace._environments:
environment = self._workspace._environments[environment_path]
else:
environment = jedi.api.environment.create_environment(
path=environment_path, safe=False, env_vars=env_vars
)
self._workspace._environments[environment_path] = environment
return environment
def sys_path(
self,
environment_path=None,
env_vars=None,
prioritize_extra_paths=False,
extra_paths=[],
):
# Copy our extra sys path
path = list(self._extra_sys_path)
environment = self.get_enviroment(
environment_path=environment_path, env_vars=env_vars
)
path.extend(environment.get_sys_path())
if prioritize_extra_paths:
path = extra_paths + path
else:
path = path + extra_paths
return path
class Notebook:
"""Represents a notebook."""
def __init__(
self, uri, notebook_type, workspace, cells=None, version=None, metadata=None
) -> None:
self.uri = uri
self.notebook_type = notebook_type
self.workspace = workspace
self.version = version
self.cells = cells or []
self.metadata = metadata or {}
self._lock = RLock()
def __str__(self):
return "Notebook with URI '%s'" % str(self.uri)
def add_cells(self, new_cells: list, start: int) -> None:
self.cells[start:start] = new_cells
def remove_cells(self, start: int, delete_count: int) -> None:
del self.cells[start : start + delete_count]
def cell_data(self):
"""Extract current cell data.
Returns a dict (ordered by cell position) where the key is the cell uri and the
value is a dict with line_start, line_end, and source attributes.
"""
cell_data = {}
offset = 0
for cell in self.cells:
cell_uri = cell["document"]
cell_document = self.workspace.get_cell_document(cell_uri)
num_lines = cell_document.line_count
cell_data[cell_uri] = {
"line_start": offset,
"line_end": offset + num_lines - 1,
"source": cell_document.source,
}
offset += num_lines
return cell_data
@lock
def jedi_names(
self,
up_to_cell_uri: Optional[str] = None,
all_scopes=False,
definitions=True,
references=False,
):
"""
Get the names in the notebook up to a certain cell.
Parameters
----------
up_to_cell_uri: str, optional
The cell uri to stop at. If None, all cells are considered.
"""
names = set()
for cell in self.cells:
cell_uri = cell["document"]
cell_document = self.workspace.get_cell_document(cell_uri)
names.update(cell_document.jedi_names(all_scopes, definitions, references))
if cell_uri == up_to_cell_uri:
break
return {name.name for name in names}
class Cell(Document):
"""
Represents a cell in a notebook.
Notes
-----
We inherit from Document for now to get the same API. However, a cell document differs from text documents in that
they have a language id.
"""
def __init__(
self,
uri,
notebook_uri,
language_id,
workspace,
source=None,
version=None,
local=True,
extra_sys_path=None,
rope_project_builder=None,
) -> None:
super().__init__(
uri, workspace, source, version, local, extra_sys_path, rope_project_builder
)
self.language_id = language_id
self.notebook_uri = notebook_uri
@property
@lock
def line_count(self):
""" "Return the number of lines in the cell document."""
return len(self.source.split("\n"))