"""Operating system-related utility functions for Sphinx.""" from __future__ import annotations import contextlib import filecmp import os import re import shutil import sys import unicodedata from io import StringIO from os import path from pathlib import Path from typing import TYPE_CHECKING from sphinx.locale import __ if TYPE_CHECKING: from types import TracebackType from typing import Any # SEP separates path elements in the canonical file names # # Define SEP as a manifest constant, not so much because we expect it to change # in the future as to avoid the suspicion that a stray "/" in the code is a # hangover from more *nix-oriented origins. SEP = '/' def os_path(canonical_path: str, /) -> str: return canonical_path.replace(SEP, path.sep) def canon_path(native_path: str | os.PathLike[str], /) -> str: """Return path in OS-independent form""" return os.fspath(native_path).replace(path.sep, SEP) def path_stabilize(filepath: str | os.PathLike[str], /) -> str: """Normalize path separator and unicode string""" new_path = canon_path(filepath) return unicodedata.normalize('NFC', new_path) def relative_uri(base: str, to: str) -> str: """Return a relative URL from ``base`` to ``to``.""" if to.startswith(SEP): return to b2 = base.split('#')[0].split(SEP) t2 = to.split('#')[0].split(SEP) # remove common segments (except the last segment) for x, y in zip(b2[:-1], t2[:-1], strict=False): if x != y: break b2.pop(0) t2.pop(0) if b2 == t2: # Special case: relative_uri('f/index.html','f/index.html') # returns '', not 'index.html' return '' if len(b2) == 1 and t2 == ['']: # Special case: relative_uri('f/index.html','f/') should # return './', not '' return '.' + SEP return ('..' + SEP) * (len(b2) - 1) + SEP.join(t2) def ensuredir(file: str | os.PathLike[str]) -> None: """Ensure that a path exists.""" os.makedirs(file, exist_ok=True) def _last_modified_time(source: str | os.PathLike[str], /) -> int: """Return the last modified time of ``filename``. The time is returned as integer microseconds. The lowest common denominator of modern file-systems seems to be microsecond-level precision. We prefer to err on the side of re-rendering a file, so we round up to the nearest microsecond. """ st = source.stat() if isinstance(source, os.DirEntry) else os.stat(source) # upside-down floor division to get the ceiling return -(st.st_mtime_ns // -1_000) def _copy_times(source: str | os.PathLike[str], dest: str | os.PathLike[str]) -> None: """Copy a file's modification times.""" st = source.stat() if isinstance(source, os.DirEntry) else os.stat(source) os.utime(dest, ns=(st.st_atime_ns, st.st_mtime_ns)) def copyfile( source: str | os.PathLike[str], dest: str | os.PathLike[str], *, force: bool = False, ) -> None: """Copy a file and its modification times, if possible. :param source: An existing source to copy. :param dest: The destination path. :param bool force: Overwrite the destination file even if it exists. :raise FileNotFoundError: The *source* does not exist. .. note:: :func:`copyfile` is a no-op if *source* and *dest* are identical. """ # coerce to Path objects source = Path(source) dest = Path(dest) if not source.exists(): msg = f'{source} does not exist' raise FileNotFoundError(msg) if ( not (dest_exists := dest.exists()) # comparison must be done using shallow=False since # two different files might have the same size or not filecmp.cmp(source, dest, shallow=False) ): if not force and dest_exists: # sphinx.util.logging imports sphinx.util.osutil, # so use a local import to avoid circular imports from sphinx.util import logging logger = logging.getLogger(__name__) msg = __( 'Aborted attempted copy from %s to %s ' '(the destination path has existing data).' ) logger.warning(msg, source, dest, type='misc', subtype='copy_overwrite') return shutil.copyfile(source, dest) with contextlib.suppress(OSError): # don't do full copystat because the source may be read-only _copy_times(source, dest) _no_fn_re = re.compile(r'[^a-zA-Z0-9_-]') def make_filename(string: str) -> str: return _no_fn_re.sub('', string) or 'sphinx' def make_filename_from_project(project: str) -> str: return make_filename(project.removesuffix(' Documentation')).lower() def relpath( path: str | os.PathLike[str], start: str | os.PathLike[str] | None = os.curdir ) -> str: """Return a relative filepath to *path* either from the current directory or from an optional *start* directory. This is an alternative of ``os.path.relpath()``. This returns original path if *path* and *start* are on different drives (for Windows platform). """ try: return os.path.relpath(path, start) except ValueError: return str(path) safe_relpath = relpath # for compatibility fs_encoding = sys.getfilesystemencoding() or sys.getdefaultencoding() abspath = path.abspath class _chdir: """Remove this fall-back once support for Python 3.10 is removed.""" def __init__(self, target_dir: str, /) -> None: self.path = target_dir self._dirs: list[str] = [] def __enter__(self) -> None: self._dirs.append(os.getcwd()) os.chdir(self.path) def __exit__( self, type: type[BaseException] | None, value: BaseException | None, traceback: TracebackType | None, /, ) -> None: os.chdir(self._dirs.pop()) if sys.version_info[:2] < (3, 11): cd = _chdir class FileAvoidWrite: """File-like object that buffers output and only writes if content changed. Use this class like when writing to a file to avoid touching the original file if the content hasn't changed. This is useful in scenarios where file mtime is used to invalidate caches or trigger new behavior. When writing to this file handle, all writes are buffered until the object is closed. Objects can be used as context managers. """ def __init__(self, path: str | Path) -> None: self._path = path self._io: StringIO | None = None def write(self, data: str) -> None: if not self._io: self._io = StringIO() self._io.write(data) def close(self) -> None: """Stop accepting writes and write file, if needed.""" if not self._io: msg = 'FileAvoidWrite does not support empty files.' raise Exception(msg) buf = self.getvalue() self._io.close() try: with open(self._path, encoding='utf-8') as old_f: old_content = old_f.read() if old_content == buf: return except OSError: pass with open(self._path, 'w', encoding='utf-8') as f: f.write(buf) def __enter__(self) -> FileAvoidWrite: return self def __exit__( self, exc_type: type[Exception], exc_value: Exception, traceback: Any ) -> bool: self.close() return True def __getattr__(self, name: str) -> Any: # Proxy to _io instance. if not self._io: msg = 'Must write to FileAvoidWrite before other methods can be used' raise Exception(msg) return getattr(self._io, name) def rmtree(path: str) -> None: if os.path.isdir(path): shutil.rmtree(path) else: os.remove(path)