"""
Path and filesystem utilities.
The :class:`Path` object is an extension of :class:`pathlib.Path` that contains
extra convenience methods corresponding to the extra functional methods in this
module. (New in 0.11.0). See the class documentation for more details.
This module also defines functional path-related utilities, but moving forward
users should prefer using :class:`Path` over standalone functional methods. The
functions methods will still be available for the forseable future, but their
functionality is made redundant by :class:`Path`. For completeness these
functions are listed
The :func:`expandpath` function expands the tilde to ``$HOME`` and environment
variables to their values.
The :func:`augpath` function creates variants of an existing path without
having to spend multiple lines of code splitting it up and stitching it back
together.
The :func:`shrinkuser` function replaces your home directory with a tilde.
The :func:`userhome` function reports the home directory of the current user of
the operating system.
The :func:`ensuredir` function operates like ``mkdir -p`` in unix.
Note:
In the future the part of this module that defines Path may be renamed to
util_pathlib.
"""
from os.path import (
dirname, exists, expanduser, expandvars, join, normpath, split, splitext,
)
import os
import sys
import pathlib
import warnings
from ubelt import util_io
__all__ = [
'Path', 'TempDir', 'augpath', 'shrinkuser', 'userhome', 'ensuredir',
'expandpath', 'ChDir',
]
[docs]
def augpath(path, suffix='', prefix='', ext=None, tail='', base=None,
dpath=None, relative=None, multidot=False):
"""
Create a new path with a different extension, basename, directory, prefix,
and/or suffix.
A prefix is inserted before the basename. A suffix is inserted
between the basename and the extension. The basename and extension can be
replaced with a new one. Essentially a path is broken down into components
(dpath, base, ext), and then recombined as (dpath, prefix, base, suffix,
ext) after replacing any specified component.
Args:
path (str | PathLike): a path to augment
suffix (str):
placed between the basename and extension
Note: this is referred to as stemsuffix in :func:`ub.Path.augment`.
prefix (str):
placed in front of the basename
ext (str | None):
if specified, replaces the extension
tail (str | None):
If specified, appends this text to the extension
base (str | None):
if specified, replaces the basename without extension.
Note: this is referred to as stem in :func:`ub.Path.augment`.
dpath (str | PathLike | None):
if specified, replaces the specified "relative" directory, which by
default is the parent directory.
relative (str | PathLike | None):
Replaces ``relative`` with ``dpath`` in ``path``.
Has no effect if ``dpath`` is not specified.
Defaults to the dirname of the input ``path``.
*experimental* not currently implemented.
multidot (bool): Allows extensions to contain multiple
dots. Specifically, if False, everything after the last dot in the
basename is the extension. If True, everything after the first dot
in the basename is the extension.
Returns:
str: augmented path
Example:
>>> import ubelt as ub
>>> path = 'foo.bar'
>>> suffix = '_suff'
>>> prefix = 'pref_'
>>> ext = '.baz'
>>> newpath = ub.augpath(path, suffix, prefix, ext=ext, base='bar')
>>> print('newpath = %s' % (newpath,))
newpath = pref_bar_suff.baz
Example:
>>> from ubelt.util_path import * # NOQA
>>> augpath('foo.bar')
'foo.bar'
>>> augpath('foo.bar', ext='.BAZ')
'foo.BAZ'
>>> augpath('foo.bar', suffix='_')
'foo_.bar'
>>> augpath('foo.bar', prefix='_')
'_foo.bar'
>>> augpath('foo.bar', base='baz')
'baz.bar'
>>> augpath('foo.tar.gz', ext='.zip', multidot=True)
foo.zip
>>> augpath('foo.tar.gz', ext='.zip', multidot=False)
foo.tar.zip
>>> augpath('foo.tar.gz', suffix='_new', multidot=True)
foo_new.tar.gz
>>> augpath('foo.tar.gz', suffix='_new', tail='.cache', multidot=True)
foo_new.tar.gz.cache
"""
stem = base # new nomenclature
# Breakup path
if relative is None:
orig_dpath, fname = split(path)
else: # nocover
# if path.startswith(relative):
# orig_dpath = relative
# fname = relpath(path, relative)
# else:
# orig_dpath, fname = split(path)
raise NotImplementedError('Not implemented yet')
if multidot:
# The first dot defines the extension
parts = fname.split('.', 1)
orig_base = parts[0]
orig_ext = '' if len(parts) == 1 else '.' + parts[1]
else:
# The last dot defines the extension
orig_base, orig_ext = splitext(fname)
# Replace parts with specified augmentations
if dpath is None:
dpath = orig_dpath
if ext is None:
ext = orig_ext
if stem is None:
stem = orig_base
# Recombine into new path
new_fname = ''.join((prefix, stem, suffix, ext, tail))
newpath = join(dpath, new_fname)
return newpath
[docs]
def userhome(username=None):
"""
Returns the path to some user's home directory.
Args:
username (str | None):
name of a user on the system. If unspecified, the current user is
inferred from standard environment variables.
Returns:
str: path to the specified home directory
Raises:
KeyError: if the specified user does not exist on the system
OSError: if username is unspecified and the current user cannot be
inferred
Example:
>>> import ubelt as ub
>>> import os
>>> import getpass
>>> username = getpass.getuser()
>>> userhome_target = os.path.expanduser('~')
>>> userhome_got1 = ub.userhome()
>>> userhome_got2 = ub.userhome(username)
>>> print(f'username={username}')
>>> print(f'userhome_got1={userhome_got1}')
>>> print(f'userhome_got2={userhome_got2}')
>>> print(f'userhome_target={userhome_target}')
>>> assert userhome_got1 == userhome_target
>>> assert userhome_got2 == userhome_target
"""
if username is None:
# get home directory for the current user
if 'HOME' in os.environ:
userhome_dpath = os.environ['HOME']
else: # nocover
if sys.platform.startswith('win32'):
# win32 fallback when HOME is not defined
if 'USERPROFILE' in os.environ:
userhome_dpath = os.environ['USERPROFILE']
elif 'HOMEPATH' in os.environ:
drive = os.environ.get('HOMEDRIVE', '')
userhome_dpath = join(drive, os.environ['HOMEPATH'])
else:
raise OSError("Cannot determine the user's home directory")
else:
# posix fallback when HOME is not defined
import pwd
userhome_dpath = pwd.getpwuid(os.getuid()).pw_dir
else:
# A specific user directory was requested
if sys.platform.startswith('win32'): # nocover
# get the directory name for the current user
c_users = dirname(userhome())
userhome_dpath = join(c_users, username)
if not exists(userhome_dpath):
raise KeyError('Unknown user: {}'.format(username))
else:
import pwd
try:
pwent = pwd.getpwnam(username)
except KeyError: # nocover
raise KeyError('Unknown user: {}'.format(username))
userhome_dpath = pwent.pw_dir
return userhome_dpath
[docs]
def shrinkuser(path, home='~'):
"""
Inverse of :func:`os.path.expanduser`.
Args:
path (str | PathLike): path in system file structure
home (str): symbol used to replace the home path.
Defaults to ``'~'``, but you might want to use ``'$HOME'`` or
``'%USERPROFILE%'`` instead.
Returns:
str: shortened path replacing the home directory with a symbol
Example:
>>> from ubelt.util_path import * # NOQA
>>> path = expanduser('~')
>>> assert path != '~'
>>> assert shrinkuser(path) == '~'
>>> assert shrinkuser(path + '1') == path + '1'
>>> assert shrinkuser(path + '/1') == join('~', '1')
>>> assert shrinkuser(path + '/1', '$HOME') == join('$HOME', '1')
>>> assert shrinkuser('.') == '.'
"""
path = normpath(path)
userhome_dpath = userhome()
if path.startswith(userhome_dpath):
if len(path) == len(userhome_dpath):
path = home
elif path[len(userhome_dpath)] == os.path.sep:
path = home + path[len(userhome_dpath):]
return path
[docs]
def expandpath(path):
"""
Shell-like environment variable and tilde path expansion.
Args:
path (str | PathLike): string representation of a path
Returns:
str: expanded path
Example:
>>> from ubelt.util_path import * # NOQA
>>> import ubelt as ub
>>> assert normpath(ub.expandpath('~/foo')) == join(ub.userhome(), 'foo')
>>> assert ub.expandpath('foo') == 'foo'
"""
path = expanduser(path)
path = expandvars(path)
return path
[docs]
def ensuredir(dpath, mode=0o1777, verbose=0, recreate=False):
r"""
Ensures that directory will exist. Creates new dir with sticky bits by
default
Args:
dpath (str | PathLike | Tuple[str | PathLike]):
directory to create if it does not exist.
mode (int):
octal permissions if a new directory is created.
Defaults to 0o1777.
verbose (int): verbosity
recreate (bool): if True removes the directory and
all of its contents and creates a new empty directory.
DEPRECATED: Use ``ub.Path(dpath).delete().ensuredir()`` instead.
Returns:
str: the ensured directory
SeeAlso:
:func:`ubelt.Path.ensuredir`
Example:
>>> import ubelt as ub
>>> dpath = ub.Path.appdir('ubelt', 'ensuredir')
>>> dpath.delete()
>>> assert not dpath.exists()
>>> ub.ensuredir(dpath)
>>> assert dpath.exists()
>>> dpath.delete()
"""
if isinstance(dpath, (list, tuple)):
dpath = join(*dpath)
if recreate:
from ubelt import schedule_deprecation
schedule_deprecation(
modname='ubelt',
migration='Use ``ub.Path(dpath).delete().ensuredir()`` instead', name='recreate',
type='argument of ensuredir', deprecate='1.3.0', error='2.0.0',
remove='2.1.0',
)
util_io.delete(dpath, verbose=verbose)
if not exists(dpath):
if verbose:
print('Ensuring directory (creating {!r})'.format(dpath))
os.makedirs(normpath(dpath), mode=mode, exist_ok=True)
else:
if verbose:
print('Ensuring directory (existing {!r})'.format(dpath))
return dpath
[docs]
class ChDir:
"""
Context manager that changes the current working directory and then
returns you to where you were.
This is nearly the same as the stdlib :func:`contextlib.chdir`, with the
exception that it will do nothing if the input path is None (i.e. the user
did not want to change directories).
SeeAlso:
:func:`contextlib.chdir`
Example:
>>> import ubelt as ub
>>> dpath = ub.Path.appdir('ubelt/tests/chdir').ensuredir()
>>> dir1 = (dpath / 'dir1').ensuredir()
>>> dir2 = (dpath / 'dir2').ensuredir()
>>> with ChDir(dpath):
>>> assert ub.Path.cwd() == dpath
>>> # change to the given directory, and then returns back
>>> with ChDir(dir1):
>>> assert ub.Path.cwd() == dir1
>>> with ChDir(dir2):
>>> assert ub.Path.cwd() == dir2
>>> # changes inside the context manager will be reset
>>> os.chdir(dpath)
>>> assert ub.Path.cwd() == dir1
>>> assert ub.Path.cwd() == dpath
>>> with ChDir(dir1):
>>> assert ub.Path.cwd() == dir1
>>> with ChDir(None):
>>> assert ub.Path.cwd() == dir1
>>> # When disabled, the cwd does *not* reset at context exit
>>> os.chdir(dir2)
>>> assert ub.Path.cwd() == dir2
>>> os.chdir(dir1)
>>> # Dont change dirs, but reset to your cwd at context end
>>> with ChDir('.'):
>>> os.chdir(dir2)
>>> assert ub.Path.cwd() == dir1
>>> assert ub.Path.cwd() == dpath
"""
def __init__(self, dpath):
"""
Args:
dpath (str | PathLike | None):
The new directory to work in.
If None, then the context manager is disabled.
"""
self._context_dpath = dpath
self._orig_dpath = None
def __enter__(self):
"""
Returns:
ChDir: self
"""
if self._context_dpath is not None:
self._orig_dpath = os.getcwd()
os.chdir(self._context_dpath)
return self
def __exit__(self, ex_type, ex_value, ex_traceback):
"""
Args:
ex_type (Type[BaseException] | None):
ex_value (BaseException | None):
ex_traceback (TracebackType | None):
Returns:
bool | None
"""
if self._context_dpath is not None:
os.chdir(self._orig_dpath)
[docs]
class TempDir:
"""
Context for creating and cleaning up temporary directories.
Warning:
DEPRECATED. Use :mod:`tempfile` instead.
Note:
This exists because :class:`tempfile.TemporaryDirectory` was
introduced in Python 3.2. Thus once ubelt no longer supports
python 2.7, this class will be deprecated.
Attributes:
dpath (str | None): the temporary path
Note:
# WE MAY WANT TO KEEP THIS FOR WINDOWS.
Example:
>>> from ubelt.util_path import * # NOQA
>>> with TempDir() as self:
>>> dpath = self.dpath
>>> assert exists(dpath)
>>> assert not exists(dpath)
Example:
>>> from ubelt.util_path import * # NOQA
>>> self = TempDir()
>>> dpath = self.ensure()
>>> assert exists(dpath)
>>> self.cleanup()
>>> assert not exists(dpath)
"""
def __init__(self):
from ubelt import schedule_deprecation
schedule_deprecation(
modname='ubelt',
migration='Use tempfile instead', name='TempDir',
type='class', deprecate='1.2.0', error='1.4.0',
remove='1.5.0',
)
self.dpath = None
def __del__(self):
self.cleanup()
[docs]
def ensure(self):
"""
Returns:
str: the path
"""
import tempfile
if not self.dpath:
self.dpath = tempfile.mkdtemp()
return self.dpath
[docs]
def cleanup(self):
if self.dpath:
import shutil
shutil.rmtree(self.dpath)
self.dpath = None
[docs]
def start(self):
"""
Returns:
TempDir: self
"""
self.ensure()
return self
def __enter__(self):
"""
Returns:
TempDir: self
"""
return self.start()
def __exit__(self, ex_type, ex_value, ex_traceback):
"""
Args:
ex_type (Type[BaseException] | None):
ex_value (BaseException | None):
ex_traceback (TracebackType | None):
Returns:
bool | None
"""
self.cleanup()
_PathBase = pathlib.WindowsPath if os.name == 'nt' else pathlib.PosixPath
[docs]
class Path(_PathBase):
"""
This class extends :class:`pathlib.Path` with extra functionality and
convenience methods.
New methods are designed to support chaining.
In addition to new methods this class supports the addition (``+``)
operator via which allows for better drop-in compatibility with code using
existing string-based paths.
Note:
On windows this inherits from :class:`pathlib.WindowsPath`.
New methods are
* :py:meth:`ubelt.Path.ensuredir` - Like mkdir but with easier defaults.
* :py:meth:`ubelt.Path.delete` - Previously pathlib could only remove one file at a time.
* :py:meth:`ubelt.Path.copy` - Pathlib has no similar functionality.
* :py:meth:`ubelt.Path.move` - Pathlib has no similar functionality.
* :py:meth:`ubelt.Path.augment` - Unifies and extends disparate functionality across pathlib.
* :py:meth:`ubelt.Path.expand` - Unifies existing environ and home expansion.
* :py:meth:`ubelt.Path.ls` - Like iterdir, but more interactive.
* :py:meth:`ubelt.Path.shrinkuser` - Python has no similar functionality.
* :py:meth:`ubelt.Path.walk` - Pathlib had no similar functionality.
New classmethods are
* :py:meth:`ubelt.Path.appdir` - application directories
Modified methods are
* :py:meth:`ubelt.Path.touch` - returns self to support chaining
* :py:meth:`ubelt.Path.chmod` - returns self to support chaining and
now accepts string-based permission codes.
Example:
>>> # Ubelt extends pathlib functionality
>>> import ubelt as ub
>>> # Chain expansion and mkdir with cumbersome args.
>>> dpath = ub.Path('~/.cache/ubelt/demo_path').expand().ensuredir()
>>> fpath = dpath / 'text_file.txt'
>>> # Augment is concise and chainable
>>> aug_fpath = fpath.augment(stemsuffix='.aux', ext='.jpg').touch()
>>> aug_dpath = dpath.augment(stemsuffix='demo_path2')
>>> assert aug_fpath.read_text() == ''
>>> fpath.write_text('text data')
>>> assert aug_fpath.exists()
>>> # Delete is akin to "rm -rf" and is also chainable.
>>> assert not aug_fpath.delete().exists()
>>> assert dpath.exists()
>>> assert not dpath.delete().exists()
>>> print(f'{str(fpath.shrinkuser()).replace(os.path.sep, "/")}')
>>> print(f'{str(dpath.shrinkuser()).replace(os.path.sep, "/")}')
>>> print(f'{str(aug_fpath.shrinkuser()).replace(os.path.sep, "/")}')
>>> print(f'{str(aug_dpath.shrinkuser()).replace(os.path.sep, "/")}')
~/.cache/ubelt/demo_path/text_file.txt
~/.cache/ubelt/demo_path
~/.cache/ubelt/demo_path/text_file.aux.jpg
~/.cache/ubelt/demo_pathdemo_path2
Inherited unmodified properties from :class:`pathlib.Path` are:
* :py:data:`pathlib.PurePath.anchor`
* :py:data:`pathlib.PurePath.name`
* :py:data:`pathlib.PurePath.parts`
* :py:data:`pathlib.PurePath.parent`
* :py:data:`pathlib.PurePath.parents`
* :py:data:`pathlib.PurePath.suffix`
* :py:data:`pathlib.PurePath.suffixes`
* :py:data:`pathlib.PurePath.stem`
* :py:data:`pathlib.PurePath.drive`
* :py:data:`pathlib.PurePath.root`
Inherited unmodified classmethods from :class:`pathlib.Path` are:
* :py:meth:`pathlib.Path.cwd`
* :py:meth:`pathlib.Path.home`
Inherited unmodified methods from :class:`pathlib.Path` are:
* :py:meth:`pathlib.Path.samefile`
* :py:meth:`pathlib.Path.iterdir`
* :py:meth:`pathlib.Path.glob`
* :py:meth:`pathlib.Path.rglob`
* :py:meth:`pathlib.Path.resolve`
* :py:meth:`pathlib.Path.lstat`
* :py:meth:`pathlib.Path.stat`
* :py:meth:`pathlib.Path.owner`
* :py:meth:`pathlib.Path.group`
* :py:meth:`pathlib.Path.open`
* :py:meth:`pathlib.Path.read_bytes`
* :py:meth:`pathlib.Path.read_text`
* :py:meth:`pathlib.Path.write_bytes`
* :py:meth:`pathlib.Path.write_text`
* :py:meth:`pathlib.Path.readlink`
* :py:meth:`pathlib.Path.mkdir` - we recommend :py:meth:`ubelt.Path.ensuredir` instead.
* :py:meth:`pathlib.Path.lchmod`
* :py:meth:`pathlib.Path.unlink`
* :py:meth:`pathlib.Path.rmdir`
* :py:meth:`pathlib.Path.rename`
* :py:meth:`pathlib.Path.replace`
* :py:meth:`pathlib.Path.symlink_to`
* :py:meth:`pathlib.Path.hardlink_to`
* :py:meth:`pathlib.Path.link_to` - deprecated
* :py:meth:`pathlib.Path.exists`
* :py:meth:`pathlib.Path.is_dir`
* :py:meth:`pathlib.Path.is_file`
* :py:meth:`pathlib.Path.is_mount`
* :py:meth:`pathlib.Path.is_symlink`
* :py:meth:`pathlib.Path.is_block_device`
* :py:meth:`pathlib.Path.is_char_device`
* :py:meth:`pathlib.Path.is_fifo`
* :py:meth:`pathlib.Path.is_socket`
* :py:meth:`pathlib.Path.expanduser` - we recommend :py:meth:`ubelt.Path.expand` instead.
* :py:meth:`pathlib.PurePath.as_posix`
* :py:meth:`pathlib.PurePath.as_uri`
* :py:meth:`pathlib.PurePath.with_name` - we recommend :py:meth:`ubelt.Path.augment` instead.
* :py:meth:`pathlib.PurePath.with_stem` - we recommend :py:meth:`ubelt.Path.augment` instead.
* :py:meth:`pathlib.PurePath.with_suffix` - we recommend :py:meth:`ubelt.Path.augment` instead.
* :py:meth:`pathlib.PurePath.relative_to`
* :py:meth:`pathlib.PurePath.joinpath`
* :py:meth:`pathlib.PurePath.is_relative_to`
* :py:meth:`pathlib.PurePath.is_absolute`
* :py:meth:`pathlib.PurePath.is_reserved`
* :py:meth:`pathlib.PurePath.match`
"""
__slots__ = ()
[docs]
@classmethod
def appdir(cls, appname=None, *args, type='cache'):
"""
Returns a standard platform specific directory for an application to
use as cache, config, or data.
The default root location depends on the platform and is specified the
the following table:
TextArt:
| POSIX | Windows | MacOSX
data | $XDG_DATA_HOME | %APPDATA% | ~/Library/Application Support
config | $XDG_CONFIG_HOME | %APPDATA% | ~/Library/Application Support
cache | $XDG_CACHE_HOME | %LOCALAPPDATA% | ~/Library/Caches
If an environment variable is not specified the defaults are:
APPDATA = ~/AppData/Roaming
LOCALAPPDATA = ~/AppData/Local
XDG_DATA_HOME = ~/.local/share
XDG_CACHE_HOME = ~/.cache
XDG_CONFIG_HOME = ~/.config
Args:
appname (str | None):
The name of the application.
*args : optional subdirs
type (str):
the type of data the expected to be stored in this application
directory. Valid options are 'cache', 'config', or 'data'.
Returns:
Path: a new path object for the specified application directory.
SeeAlso:
This provides functionality similar to the
`appdirs <https://pypi.org/project/appdirs/>`_ -
and
`platformdirs <https://platformdirs.readthedocs.io/en/latest/api.html>`_ -
packages.
Example:
>>> # xdoctest: +IGNORE_WANT
>>> import ubelt as ub
>>> print(ub.Path.appdir('ubelt', type='cache').shrinkuser())
>>> print(ub.Path.appdir('ubelt', type='config').shrinkuser())
>>> print(ub.Path.appdir('ubelt', type='data').shrinkuser())
~/.cache/ubelt
~/.config/ubelt
~/.local/share/ubelt
>>> import pytest
>>> with pytest.raises(KeyError):
>>> ub.Path.appdir('ubelt', type='other')
Example:
>>> # xdoctest: +IGNORE_WANT
>>> import ubelt as ub
>>> # Can now call appdir without any arguments
>>> print(ub.Path.appdir().shrinkuser())
~/.cache
"""
from ubelt import util_platform
if type == 'cache':
base = util_platform.platform_cache_dir()
elif type == 'config':
base = util_platform.platform_config_dir()
elif type == 'data':
base = util_platform.platform_data_dir()
else:
raise KeyError(type)
if appname is None:
return cls(base, *args)
else:
return cls(base, appname, *args)
[docs]
def augment(self, prefix='', stemsuffix='', ext=None, stem=None, dpath=None,
tail='', relative=None, multidot=False, suffix=''):
"""
Create a new path with a different extension, basename, directory,
prefix, and/or suffix.
See :func:`augpath` for more details.
Args:
prefix (str):
Text placed in front of the stem. Defaults to ''.
stemsuffix (str):
Text placed between the stem and extension. Defaults to ''.
ext (str | None):
If specified, replaces the extension
stem (str | None):
If specified, replaces the stem (i.e. basename without
extension).
dpath (str | PathLike | None):
If specified, replaces the specified "relative" directory,
which by default is the parent directory.
tail (str | None):
If specified, appends this text the very end of the path -
after the extension.
relative (str | PathLike | None):
Replaces ``relative`` with ``dpath`` in ``path``.
Has no effect if ``dpath`` is not specified.
Defaults to the dirname of the input ``path``.
*experimental* not currently implemented.
multidot (bool): Allows extensions to contain
multiple dots. Specifically, if False, everything after the
last dot in the basename is the extension. If True, everything
after the first dot in the basename is the extension.
SeeAlso:
:py:meth:`pathlib.Path.with_stem`
:py:meth:`pathlib.Path.with_name`
:py:meth:`pathlib.Path.with_suffix`
Returns:
Path: augmented path
Warning:
NOTICE OF BACKWARDS INCOMPATABILITY.
THE INITIAL RELEASE OF Path.augment suffered from an unfortunate
variable naming decision that conflicts with pathlib.Path
.. code:: python
p = ub.Path('the.entire.fname.or.dname.is.the.name.exe')
print(f'p ={p}')
print(f'p.name={p.name}')
p = ub.Path('the.stem.ends.here.ext')
print(f'p ={p}')
print(f'p.stem={p.stem}')
p = ub.Path('only.the.last.dot.is.the.suffix')
print(f'p ={p}')
print(f'p.suffix={p.suffix}')
p = ub.Path('but.all.suffixes.can.be.recovered')
print(f'p ={p}')
print(f'p.suffixes={p.suffixes}')
Example:
>>> import ubelt as ub
>>> path = ub.Path('foo.bar')
>>> suffix = '_suff'
>>> prefix = 'pref_'
>>> ext = '.baz'
>>> newpath = path.augment(prefix=prefix, stemsuffix=suffix, ext=ext, stem='bar')
>>> print('newpath = {!r}'.format(newpath))
newpath = Path('pref_bar_suff.baz')
Example:
>>> import ubelt as ub
>>> path = ub.Path('foo.bar')
>>> stemsuffix = '_suff'
>>> prefix = 'pref_'
>>> ext = '.baz'
>>> newpath = path.augment(prefix=prefix, stemsuffix=stemsuffix, ext=ext, stem='bar')
>>> print('newpath = {!r}'.format(newpath))
Example:
>>> # Compare our augpath(ext=...) versus pathlib with_suffix(...)
>>> import ubelt as ub
>>> cases = [
>>> ub.Path('no_ext'),
>>> ub.Path('one.ext'),
>>> ub.Path('double..dot'),
>>> ub.Path('two.many.cooks'),
>>> ub.Path('path.with.three.dots'),
>>> ub.Path('traildot.'),
>>> ub.Path('doubletraildot..'),
>>> ub.Path('.prefdot'),
>>> ub.Path('..doubleprefdot'),
>>> ]
>>> for path in cases:
>>> print('--')
>>> print('path = {}'.format(ub.repr2(path, nl=1)))
>>> ext = '.EXT'
>>> method_pathlib = path.with_suffix(ext)
>>> method_augment = path.augment(ext=ext)
>>> if method_pathlib == method_augment:
>>> print(ub.color_text('sagree', 'green'))
>>> else:
>>> print(ub.color_text('disagree', 'red'))
>>> print('path.with_suffix({}) = {}'.format(ext, ub.repr2(method_pathlib, nl=1)))
>>> print('path.augment(ext={}) = {}'.format(ext, ub.repr2(method_augment, nl=1)))
>>> print('--')
"""
if suffix: # nocover
from ubelt.util_deprecate import schedule_deprecation
schedule_deprecation(
'ubelt', 'suffix', 'arg',
deprecate='1.1.3', remove='1.4.0',
migration='Use stemsuffix instead',
)
if not stemsuffix:
stemsuffix = suffix
warnings.warn(
'DEVELOPER NOTICE: The ubelt.Path.augment function may '
'experience a BACKWARDS INCOMPATIBLE update in the future '
'having to do with the suffix argument to ub.Path.augment '
'To avoid any issue use the ``stemsuffix` argument or use the '
'``ubelt.augpath`` function instead. '
'If you see this warning, please make an '
'issue on https://github.com/Erotemic/ubelt/issues indicating '
'that there are users of this function in the wild. If there '
'are none, then this signature will be "fixed", but if anyone '
'depends on this feature then we will continue to support it as '
'is.'
)
aug = augpath(self, suffix=stemsuffix, prefix=prefix, ext=ext, base=stem,
dpath=dpath, relative=relative, multidot=multidot,
tail=tail)
new = self.__class__(aug)
return new
[docs]
def delete(self):
"""
Removes a file or recursively removes a directory.
If a path does not exist, then this is does nothing.
SeeAlso:
:func:`ubelt.delete`
Returns:
Path: reference to self
Example:
>>> import ubelt as ub
>>> from os.path import join
>>> base = ub.Path.appdir('ubelt', 'delete_test2')
>>> dpath1 = (base / 'dir').ensuredir()
>>> (base / 'dir' / 'subdir').ensuredir()
>>> (base / 'dir' / 'to_remove1.txt').touch()
>>> fpath1 = (base / 'dir' / 'subdir' / 'to_remove3.txt').touch()
>>> fpath2 = (base / 'dir' / 'subdir' / 'to_remove2.txt').touch()
>>> assert all(p.exists() for p in [dpath1, fpath1, fpath2])
>>> fpath1.delete()
>>> assert all(p.exists() for p in [dpath1, fpath2])
>>> assert not fpath1.exists()
>>> dpath1.delete()
>>> assert not any(p.exists() for p in [dpath1, fpath1, fpath2])
"""
util_io.delete(self)
return self
[docs]
def ensuredir(self, mode=0o777):
"""
Concise alias of ``self.mkdir(parents=True, exist_ok=True)``
Args:
mode (int):
octal permissions if a new directory is created.
Defaults to 0o777.
Returns:
Path: returns itself
Example:
>>> import ubelt as ub
>>> cache_dpath = ub.Path.appdir('ubelt').ensuredir()
>>> dpath = ub.Path(cache_dpath, 'newdir')
>>> dpath.delete()
>>> assert not dpath.exists()
>>> dpath.ensuredir()
>>> assert dpath.exists()
>>> dpath.rmdir()
"""
self.mkdir(mode=mode, parents=True, exist_ok=True)
return self
[docs]
def mkdir(self, mode=511, parents=False, exist_ok=False):
"""
Create a new directory at this given path.
Note:
The ubelt extension is the same as the original pathlib method,
except this returns returns the path instead of None.
Args:
mode (int) : permission bits
parents (bool) : create parents
exist_ok (bool) : fail if exists
Returns:
Path: returns itself
"""
super().mkdir(mode=mode, parents=parents, exist_ok=exist_ok)
return self
[docs]
def expand(self):
"""
Expands user tilde and environment variables.
Concise alias of ``Path(os.path.expandvars(self.expanduser()))``
Returns:
Path: path with expanded environment variables and tildes
Example:
>>> import ubelt as ub
>>> home_v1 = ub.Path('~/').expand()
>>> home_v2 = ub.Path.home()
>>> print('home_v1 = {!r}'.format(home_v1))
>>> print('home_v2 = {!r}'.format(home_v2))
>>> assert home_v1 == home_v2
"""
return self.expandvars().expanduser()
[docs]
def expandvars(self):
"""
As discussed in [CPythonIssue21301]_, CPython won't be adding
expandvars to pathlib. I think this is a mistake, so I added it in this
extension.
Returns:
Path: path with expanded environment variables
References:
.. [CPythonIssue21301] https://bugs.python.org/issue21301
"""
return self.__class__(os.path.expandvars(self))
[docs]
def ls(self, pattern=None):
"""
A convenience function to list all paths in a directory.
This is a wrapper around iterdir that returns the results as a list
instead of a generator. This is mainly for faster navigation in
IPython. In production code ``iterdir`` or ``glob`` should be used
instead.
Args:
pattern (None | str):
if specified, performs a glob instead of an iterdir.
Returns:
List['Path']: an eagerly evaluated list of paths
Note:
When pattern is specified only paths matching the pattern are
returned, not the paths inside matched directories. This is
different than bash semantics where the pattern is first expanded
and then ls is performed on all matching paths.
Example:
>>> import ubelt as ub
>>> self = ub.Path.appdir('ubelt/tests/ls')
>>> (self / 'dir1').ensuredir()
>>> (self / 'dir2').ensuredir()
>>> (self / 'file1').touch()
>>> (self / 'file2').touch()
>>> (self / 'dir1/file3').touch()
>>> (self / 'dir2/file4').touch()
>>> children = self.ls()
>>> assert isinstance(children, list)
>>> print(ub.repr2(sorted([p.relative_to(self) for p in children])))
[
Path('dir1'),
Path('dir2'),
Path('file1'),
Path('file2'),
]
>>> children = self.ls('dir*/*')
>>> assert isinstance(children, list)
>>> print(ub.repr2(sorted([p.relative_to(self) for p in children])))
[
Path('dir1/file3'),
Path('dir2/file4'),
]
"""
if pattern is None:
return list(self.iterdir())
else:
return list(self.glob(pattern))
# TODO:
# def _glob(self):
# """
# I would like some way of globbing using patterns contained in the path
# itself. Perhaps this goes into expand?
# """
# import glob
# yield from map(self.__class__, glob.glob(self))
[docs]
def shrinkuser(self, home='~'):
"""
Shrinks your home directory by replacing it with a tilde.
This is the inverse of :func:`os.path.expanduser`.
Args:
home (str): symbol used to replace the home path.
Defaults to '~', but you might want to use '$HOME' or
'%USERPROFILE%' instead.
Returns:
Path: shortened path replacing the home directory with a symbol
Example:
>>> import ubelt as ub
>>> path = ub.Path('~').expand()
>>> assert str(path.shrinkuser()) == '~'
>>> assert str(ub.Path((str(path) + '1')).shrinkuser()) == str(path) + '1'
>>> assert str((path / '1').shrinkuser()) == join('~', '1')
>>> assert str((path / '1').shrinkuser('$HOME')) == join('$HOME', '1')
>>> assert str(ub.Path('.').shrinkuser()) == '.'
"""
shrunk = shrinkuser(self, home)
new = self.__class__(shrunk)
return new
[docs]
def chmod(self, mode, follow_symlinks=True):
"""
Change the permissions of the path, like os.chmod().
Args:
mode (int | str): either a stat code to pass directly to
:func:`os.chmod` or a string-based code to construct modified
permissions. See note for details on the string-based chmod
codes.
follow_symlinks (bool):
if True, and this path is a symlink, modify permission of the
file it points to, otherwise if False, modify the link
permission.
Note:
From the chmod man page:
The format of a symbolic mode is [ugoa...][[-+=][perms...]...], where
perms is either zero or more letters from the set rwxXst, or a single
letter from the set ugo. Multiple symbolic modes can be given,
separated by commas.
Note:
Like :func:`os.chmod`, this may not work on Windows or on certain
filesystems.
Returns:
Path: returns self for chaining
Example:
>>> # xdoctest: +REQUIRES(POSIX)
>>> import ubelt as ub
>>> from ubelt.util_path import _encode_chmod_int
>>> dpath = ub.Path.appdir('ubelt/tests/chmod').ensuredir()
>>> fpath = (dpath / 'file.txt').touch()
>>> fpath.chmod('ugo+rw,ugo-x')
>>> print(_encode_chmod_int(fpath.stat().st_mode))
u=rw,g=rw,o=rw
>>> fpath.chmod('o-rwx')
>>> print(_encode_chmod_int(fpath.stat().st_mode))
u=rw,g=rw
>>> fpath.chmod(0o646)
>>> print(_encode_chmod_int(fpath.stat().st_mode))
u=rw,g=r,o=rw
"""
if isinstance(mode, str):
# Resolve mode
# Follow symlinks was added to pathlib.Path.stat in 3.10
# but os.stat has had it since 3.3, so use that instead.
old_mode = os.stat(self, follow_symlinks=follow_symlinks).st_mode
# old_mode = self.stat(follow_symlinks=follow_symlinks).st_mode
mode = _resolve_chmod_code(old_mode, mode)
os.chmod(self, mode, follow_symlinks=follow_symlinks)
return self
# Should not need to modify unless we want chanability here.
# def lchmod(self, mode):
# """
# Like chmod(), except if the path points to a symlink, the symlink's
# permissions are changed, rather than its target's.
#
# Args:
# mode (int | str): either a stat code to pass directly to
# :func:`os.chmod` or a string-based code to construct modified
# permissions.
#
# Returns:
# Path: returns self for chaining
#
# Example:
# >>> import ubelt as ub
# >>> from ubelt.util_path import _encode_chmod_int
# >>> dpath = ub.Path.appdir('ubelt/tests/chmod').ensuredir()
# >>> fpath = (dpath / 'file1.txt').delete().touch()
# >>> lpath = (dpath / 'link1.txt').delete()
# >>> lpath.symlink_to(fpath)
# >>> print(_encode_chmod_int(fpath.stat().st_mode))
# >>> lpath.lchmod('a+rwx')
# >>> print(_encode_chmod_int(fpath.stat().st_mode))
# """
# return self.chmod(mode, follow_symlinks=False)
[docs]
def touch(self, mode=0o666, exist_ok=True):
"""
Create this file with the given access mode, if it doesn't exist.
Returns:
Path: returns itself
Note:
The :func:`ubelt.util_io.touch` function currently has a slightly
different implementation. This uses whatever the pathlib version
is. This may change in the future.
"""
# modify touch to return self
# Note: util_io.touch is more expressive than standard python
# touch, may want to use that instead.
super().touch(mode=mode, exist_ok=exist_ok)
return self
[docs]
def walk(self, topdown=True, onerror=None, followlinks=False):
"""
A variant of :func:`os.walk` for pathlib
Args:
topdown (bool):
if True starts yield nodes closer to the root first otherwise
yield nodes closer to the leaves first.
onerror (Callable[[OSError], None] | None):
A function with one argument of type OSError. If the
error is raised the walk is aborted, otherwise it continues.
followlinks (bool):
if True recurse into symbolic directory links
Yields:
Tuple['Path', List[str], List[str]]:
the root path, directory names, and file names
Example:
>>> import ubelt as ub
>>> self = ub.Path.appdir('ubelt/tests/ls')
>>> (self / 'dir1').ensuredir()
>>> (self / 'dir2').ensuredir()
>>> (self / 'file1').touch()
>>> (self / 'file2').touch()
>>> (self / 'dir1/file3').touch()
>>> (self / 'dir2/file4').touch()
>>> subdirs = list(self.walk())
>>> assert len(subdirs) == 3
Example:
>>> # Modified from the stdlib
>>> import os
>>> from os.path import join, getsize
>>> import email
>>> import ubelt as ub
>>> base = ub.Path(email.__file__).parent
>>> for root, dirs, files in base.walk():
>>> print(root, " consumes", end="")
>>> print(sum(getsize(join(root, name)) for name in files), end="")
>>> print("bytes in ", len(files), " non-directory files")
>>> if 'CVS' in dirs:
>>> dirs.remove('CVS') # don't visit CVS directories
"""
cls = self.__class__
walker = os.walk(self, topdown=topdown, onerror=onerror,
followlinks=followlinks)
for root, dnames, fnames in walker:
yield (cls(root), dnames, fnames)
def __add__(self, other):
"""
Returns a new string starting with this fspath representation.
Returns:
str
Allows ubelt.Path to be a better drop-in replacement when working with
string-based paths.
Note:
It is not recommended to write new code that uses this behavior.
This exists to make it easier to transition existing str-based
paths to pathlib.
Example:
>>> import ubelt as ub
>>> base = ub.Path('base')
>>> base_ = ub.Path('base/')
>>> base2 = ub.Path('base/2')
>>> assert base + 'foo' == 'basefoo'
>>> assert base_ + 'foo' == 'basefoo'
>>> assert base2 + 'foo' == str(base2.augment(tail='foo'))
"""
return os.fspath(self) + other
def __radd__(self, other):
"""
Returns a new string ending with this fspath representation.
Returns:
str
Allows ubelt.Path to be a better drop-in replacement when working with
string-based paths.
Note:
It is not recommended to write new code that uses this behavior.
This exists to make it easier to transition existing str-based
paths to pathlib.
Example:
>>> import ubelt as ub
>>> base = ub.Path('base')
>>> base_ = ub.Path('base/')
>>> base2 = ub.Path('base/2')
>>> assert 'foo' + base == 'foobase'
>>> assert 'foo' + base_ == 'foobase'
>>> assert 'foo' + base2 == str(base2.augment(dpath='foobase'))
"""
return other + os.fspath(self)
[docs]
def endswith(self, suffix, *args):
"""
Test if the fspath representation ends with ``suffix``.
Allows ubelt.Path to be a better drop-in replacement when working with
string-based paths.
Args:
suffix (str | Tuple[str, ...]):
One or more suffixes to test for
*args:
start (int): if specified begin testing at this position.
end (int): if specified stop testing at this position.
Returns:
bool: True if any of the suffixes match.
Example:
>>> import ubelt as ub
>>> base = ub.Path('base')
>>> assert base.endswith('se')
>>> assert not base.endswith('be')
>>> # test start / stop cases
>>> assert ub.Path('aabbccdd').endswith('cdd', 5)
>>> assert not ub.Path('aabbccdd').endswith('cdd', 6)
>>> assert ub.Path('aabbccdd').endswith('cdd', 5, 10)
>>> assert not ub.Path('aabbccdd').endswith('cdd', 5, 7)
>>> # test tuple case
>>> assert ub.Path('aabbccdd').endswith(('foo', 'cdd'))
>>> assert ub.Path('foo').endswith(('foo', 'cdd'))
>>> assert not ub.Path('bar').endswith(('foo', 'cdd'))
"""
return os.fspath(self).endswith(suffix, *args)
[docs]
def startswith(self, prefix, *args):
"""
Test if the fspath representation starts with ``prefix``.
Allows ubelt.Path to be a better drop-in replacement when working with
string-based paths.
Args:
prefix (str | Tuple[str, ...]):
One or more prefixes to test for
*args:
start (int): if specified begin testing at this position.
end (int): if specified stop testing at this position.
Returns:
bool: True if any of the prefixes match.
Example:
>>> import ubelt as ub
>>> base = ub.Path('base')
>>> assert base.startswith('base')
>>> assert not base.startswith('all your')
>>> # test start / stop cases
>>> assert ub.Path('aabbccdd').startswith('aab', 0)
>>> assert ub.Path('aabbccdd').startswith('aab', 0, 5)
>>> assert not ub.Path('aabbccdd').startswith('aab', 1, 5)
>>> assert not ub.Path('aabbccdd').startswith('aab', 0, 2)
>>> # test tuple case
>>> assert ub.Path('aabbccdd').startswith(('foo', 'aab'))
>>> assert ub.Path('foo').startswith(('foo', 'aab'))
>>> assert not ub.Path('bar').startswith(('foo', 'aab'))
"""
return os.fspath(self).startswith(prefix, *args)
# More shutil functionality
# This is discussed in https://peps.python.org/pep-0428/#filesystem-modification
[docs]
def _request_copy_function(self, follow_file_symlinks=True,
follow_dir_symlinks=True, meta='stats'):
"""
Get a copy_function based on specified capabilities
"""
import shutil
from functools import partial
if meta is None:
copy_function = partial(shutil.copyfile, follow_symlinks=follow_file_symlinks)
elif meta == 'stats':
copy_function = partial(shutil.copy2, follow_symlinks=follow_file_symlinks)
elif meta == 'mode':
copy_function = partial(shutil.copy, follow_symlinks=follow_file_symlinks)
else:
raise KeyError(meta)
return copy_function
[docs]
def copy(self, dst, follow_file_symlinks=False, follow_dir_symlinks=False,
meta='stats', overwrite=False):
"""
Copy this file or directory to dst.
By default files are never overwritten and symlinks are copied as-is.
At a basic level (i.e. ignoring symlinks) for each path argument
(``src`` and ``dst``) these can either be files, directories, or not
exist. Given these three states, the following table summarizes how
this function copies this path to its destination.
TextArt:
+----------+------------------------+------------------------+----------+
| dst | dir | file | no-exist |
+----------+ | | |
| src | | | |
+==========+========================+========================+==========+
| dir | error-or-overwrite-dst | error | dst |
+----------+------------------------+------------------------+----------+
| file | dst / src.name | error-or-overwrite-dst | dst |
+----------+------------------------+------------------------+----------+
| no-exist | error | error | error |
+----------+------------------------+------------------------+----------+
In general, the contents of src will be the contents of dst, except for
the one case where a file is copied into an existing directory. In this
case the name is used to construct a fully qualified destination.
Args:
dst (str | PathLike):
if ``src`` is a file and ``dst`` does not exist, copies this to ``dst``
if ``src`` is a file and ``dst`` is a directory, copies this to ``dst / src.name``
if ``src`` is a directory and ``dst`` does not exist, copies this to ``dst``
if ``src`` is a directory and ``dst`` is a directory, errors unless
overwrite is True, in which case, copies this to ``dst`` and
overwrites anything conflicting path.
follow_file_symlinks (bool):
If True and src is a link, the link will be resolved before
it is copied (i.e. the data is duplicated), otherwise just
the link itself will be copied.
follow_dir_symlinks (bool):
if True when src is a directory and contains symlinks to
other directories, the contents of the linked data are
copied, otherwise when False only the link itself is
copied.
meta (str | None):
Indicates what metadata bits to copy. This can be 'stats' which
tries to copy all metadata (i.e. like :py:func:`shutil.copy2`),
'mode' which copies just the permission bits (i.e. like
:py:func:`shutil.copy`), or None, which ignores all metadata
(i.e. like :py:func:`shutil.copyfile`).
overwrite (bool):
if False, and target file exists, this will raise an error,
otherwise the file will be overwritten.
Returns:
Path: where the path was copied to
Note:
This is implemented with a combination of :func:`shutil.copy`,
:func:`shutil.copy2`, and :func:`shutil.copytree`, but the defaults
and behavior here are different (and ideally safer and more
intuitive).
Note:
Unlike cp on Linux, copying a src directory into a dst directory
will not implicitly add the src directory name to the dst
directory. This means we cannot copy directory ``<parent>/<dname>``
to ``<dst>`` and expect the result to be ``<dst>/<dname>``.
Conceptually you can expect ``<parent>/<dname>/<contents>``
to exist in ``<dst>/<contents>``.
Example:
>>> import ubelt as ub
>>> root = ub.Path.appdir('ubelt', 'tests', 'path', 'copy').delete().ensuredir()
>>> paths = {}
>>> dpath = (root / 'orig').ensuredir()
>>> clone0 = (root / 'dst_is_explicit').ensuredir()
>>> clone1 = (root / 'dst_is_parent').ensuredir()
>>> paths['fpath'] = (dpath / 'file0.txt').touch()
>>> paths['empty_dpath'] = (dpath / 'empty_dpath').ensuredir()
>>> paths['nested_dpath'] = (dpath / 'nested_dpath').ensuredir()
>>> (dpath / 'nested_dpath/d0').ensuredir()
>>> (dpath / 'nested_dpath/d0/f1.txt').touch()
>>> (dpath / 'nested_dpath/d0/f2.txt').touch()
>>> print('paths = {}'.format(ub.repr2(paths, nl=1)))
>>> assert all(p.exists() for p in paths.values())
>>> paths['fpath'].copy(clone0 / 'file0.txt')
>>> paths['fpath'].copy(clone1)
>>> paths['empty_dpath'].copy(clone0 / 'empty_dpath')
>>> paths['empty_dpath'].copy((clone1 / 'empty_dpath_alt').ensuredir(), overwrite=True)
>>> paths['nested_dpath'].copy(clone0 / 'nested_dpath')
>>> paths['nested_dpath'].copy((clone1 / 'nested_dpath_alt').ensuredir(), overwrite=True)
Ignore:
# Enumerate cases
rows = [
{'src': 'no-exist', 'dst': 'no-exist', 'result': 'error'},
{'src': 'no-exist', 'dst': 'file', 'result': 'error'},
{'src': 'no-exist', 'dst': 'dir', 'result': 'error'},
{'src': 'file', 'dst': 'no-exist', 'result': 'dst'},
{'src': 'file', 'dst': 'dir', 'result': 'dst / src.name'},
{'src': 'file', 'dst': 'file', 'result': 'error-or-overwrite-dst'},
{'src': 'dir', 'dst': 'no-exist', 'result': 'dst'},
{'src': 'dir', 'dst': 'dir', 'result': 'error-or-overwrite-dst'},
{'src': 'dir', 'dst': 'file', 'result': 'error'},
]
import pandas as pd
df = pd.DataFrame(rows)
piv = df.pivot(['src'], ['dst'], 'result')
print(piv.to_markdown(tablefmt="grid", index=True))
See: ~/code/ubelt/tests/test_path.py for test cases
"""
import shutil
copy_function = self._request_copy_function(
follow_file_symlinks=follow_file_symlinks,
follow_dir_symlinks=follow_dir_symlinks, meta=meta)
if self.is_dir():
if sys.version_info[0:2] < (3, 8): # nocover
copytree = _compat_copytree
else:
copytree = shutil.copytree
dst = copytree(
self, dst, copy_function=copy_function,
symlinks=not follow_dir_symlinks, dirs_exist_ok=overwrite)
elif self.is_file():
if not overwrite:
dst = Path(dst)
if dst.is_dir():
real_dst = dst / self.name
else:
real_dst = dst
if real_dst.exists():
raise FileExistsError('Cannot overwrite existing file unless overwrite=True')
dst = copy_function(self, dst)
else:
raise FileExistsError('The source path does not exist')
return Path(dst)
[docs]
def move(self, dst, follow_file_symlinks=False, follow_dir_symlinks=False,
meta='stats'):
"""
Move a file from one location to another, or recursively move a
directory from one location to another.
This method will refuse to overwrite anything, and there is currently
no overwrite option for technical reasons. This may change in the
future.
Args:
dst (str | PathLike):
A non-existing path where this file will be moved.
follow_file_symlinks (bool):
If True and src is a link, the link will be resolved before
it is copied (i.e. the data is duplicated), otherwise just
the link itself will be copied.
follow_dir_symlinks (bool):
if True when src is a directory and contains symlinks to
other directories, the contents of the linked data are
copied, otherwise when False only the link itself is
copied.
meta (str | None):
Indicates what metadata bits to copy. This can be 'stats' which
tries to copy all metadata (i.e. like shutil.copy2), 'mode'
which copies just the permission bits (i.e. like shutil.copy),
or None, which ignores all metadata (i.e. like
shutil.copyfile).
Note:
This method will refuse to overwrite anything.
This is implemented via :func:`shutil.move`, which depends heavily
on :func:`os.rename` semantics. For this reason, this function
will error if it would overwrite any data. If you want an
overwriting variant of move we recommend you either either copy the
data, and then delete the original (potentially inefficient), or
use :func:`shutil.move` directly if you know how :func:`os.rename`
works on your system.
Returns:
Path: where the path was moved to
Example:
>>> import ubelt as ub
>>> dpath = ub.Path.appdir('ubelt', 'tests', 'path', 'move').delete().ensuredir()
>>> paths = {}
>>> paths['dpath0'] = (dpath / 'dpath0').ensuredir()
>>> paths['dpath00'] = (dpath / 'dpath0' / 'sub0').ensuredir()
>>> paths['fpath000'] = (dpath / 'dpath0' / 'sub0' / 'f0.txt').touch()
>>> paths['fpath001'] = (dpath / 'dpath0' / 'sub0' / 'f1.txt').touch()
>>> paths['dpath01'] = (dpath / 'dpath0' / 'sub1').ensuredir()
>>> print('paths = {}'.format(ub.repr2(paths, nl=1)))
>>> assert all(p.exists() for p in paths.values())
>>> paths['dpath0'].move(dpath / 'dpath1')
"""
# Behave more like POSIX move to avoid potential confusing behavior
if exists(dst):
raise FileExistsError(
'Moves are only allowed to locations that dont exist')
import shutil
copy_function = self._request_copy_function(
follow_file_symlinks=follow_file_symlinks,
follow_dir_symlinks=follow_dir_symlinks, meta=meta)
real_dst = shutil.move(self, dst, copy_function=copy_function)
return Path(real_dst)
def _parse_chmod_code(code):
"""
Expand a chmod code into a list of actions.
Args:
code (str): of the form: [ugoa…][-+=]perms…[,…]
perms is either zero or more letters from the set rwxXst, or a
single letter from the set ugo.
Yields:
Tuple[str, str, str]: target, op, and perms.
The target is modified by the operation using the value.
target -- specified 'u' for user, 'g' for group, 'o' for other.
op -- specified as '+' to add, '-' to remove, or '=' to assign.
val -- specified as 'r' for read, 'w' for write, or 'x' for execute.
Example:
>>> from ubelt.util_path import _parse_chmod_code
>>> print(list(_parse_chmod_code('ugo+rw,+r,g=rwx')))
>>> print(list(_parse_chmod_code('o+x')))
>>> print(list(_parse_chmod_code('u-x')))
>>> print(list(_parse_chmod_code('x')))
>>> print(list(_parse_chmod_code('ugo+rwx')))
[('ugo', '+', 'rw'), ('ugo', '+', 'r'), ('g', '=', 'rwx')]
[('o', '+', 'x')]
[('u', '-', 'x')]
[('u', '+', 'x')]
[('ugo', '+', 'rwx')]
>>> import pytest
>>> with pytest.raises(ValueError):
>>> list(_parse_chmod_code('a+b+c'))
"""
import re
pat = re.compile(r'([\+\-\=])')
parts = code.split(',')
for part in parts:
ab = pat.split(part)
len_ab = len(ab)
if len_ab == 3:
targets, op, perms = ab
elif len_ab == 1:
perms = ab[0]
op = '+'
targets = 'u'
else:
raise ValueError('unknown chmod code pattern: part={part}')
if targets == '' or targets == 'a':
targets = 'ugo'
yield (targets, op, perms)
def _resolve_chmod_code(old_mode, code):
"""
Modifies integer stat permissions based on a string code.
Args:
old_mode (int): old mode from st_stat
code (str): chmod style codeold mode from st_stat
Returns:
int : new code
Example:
>>> from ubelt.util_path import _resolve_chmod_code
>>> print(oct(_resolve_chmod_code(0, '+rwx')))
>>> print(oct(_resolve_chmod_code(0, 'ugo+rwx')))
>>> print(oct(_resolve_chmod_code(0, 'a-rwx')))
>>> print(oct(_resolve_chmod_code(0, 'u+rw,go+r,go-wx')))
>>> print(oct(_resolve_chmod_code(0o777, 'u+rw,go+r,go-wx')))
0o777
0o777
0o0
0o644
0o744
>>> import pytest
>>> with pytest.raises(NotImplementedError):
>>> print(oct(_resolve_chmod_code(0, 'u=rw')))
>>> with pytest.raises(ValueError):
>>> _resolve_chmod_code(0, 'u?w')
"""
import stat
import itertools as it
action_lut = {
# TODO: handle suid, sgid, and sticky?
# suid = stat.S_ISUID
# sgid = stat.S_ISGID
# sticky = stat.S_ISVTX
'ur' : stat.S_IRUSR,
'uw' : stat.S_IWUSR,
'ux' : stat.S_IXUSR,
'gr' : stat.S_IRGRP,
'gw' : stat.S_IWGRP,
'gx' : stat.S_IXGRP,
'or' : stat.S_IROTH,
'ow' : stat.S_IWOTH,
'ox' : stat.S_IXOTH,
}
actions = _parse_chmod_code(code)
new_mode = int(old_mode) # (could optimize to modify inplace if needed)
for action in actions:
targets, op, perms = action
try:
action_keys = (target + perm for target, perm in it.product(targets, perms))
action_values = (action_lut[key] for key in action_keys)
action_values = list(action_values)
if op == '+':
for val in action_values:
new_mode |= val
elif op == '-':
for val in action_values:
new_mode &= (~val)
elif op == '=':
raise NotImplementedError(f'new chmod code for op={op}')
else:
raise AssertionError(
f'should not be able to get here. unknown op code: op={op}')
except KeyError:
# Give a better error message if something goes wrong
raise ValueError(f'Unknown action: {action}')
return new_mode
def _encode_chmod_int(int_code):
"""
Convert a chmod integer code to a string
Currently unused, but may be useful in the future.
Example:
>>> from ubelt.util_path import _encode_chmod_int
>>> int_code = 0o744
>>> print(_encode_chmod_int(int_code))
u=rwx,g=r,o=r
"""
import stat
action_lut = {
'ur' : stat.S_IRUSR,
'uw' : stat.S_IWUSR,
'ux' : stat.S_IXUSR,
'gr' : stat.S_IRGRP,
'gw' : stat.S_IWGRP,
'gx' : stat.S_IXGRP,
'or' : stat.S_IROTH,
'ow' : stat.S_IWOTH,
'ox' : stat.S_IXOTH,
}
from collections import defaultdict
target_to_perms = defaultdict(list)
for key, val in action_lut.items():
target, perm = key
if int_code & val:
target_to_perms[target].append(perm)
parts = [k + '=' + ''.join(vs) for k, vs in target_to_perms.items()]
code = ','.join(parts)
return code
if sys.version_info[0:2] < (3, 8): # nocover
# Vendor in a nearly modern copytree for Python 3.6 and 3.7
def _compat_copytree(src, dst, symlinks=False, ignore=None,
copy_function=None, ignore_dangling_symlinks=False,
dirs_exist_ok=False):
"""
A vendored shutil.copytree for older pythons based on the 3.10
implementation
"""
from shutil import Error, copystat, copy2, copy
with os.scandir(src) as itr:
entries = list(itr)
if ignore is not None:
ignored_names = ignore(os.fspath(src), [x.name for x in entries])
else:
ignored_names = set()
os.makedirs(dst, exist_ok=dirs_exist_ok)
errors = []
use_srcentry = copy_function is copy2 or copy_function is copy
for srcentry in entries:
if srcentry.name in ignored_names:
continue
srcname = os.path.join(src, srcentry.name)
dstname = os.path.join(dst, srcentry.name)
srcobj = srcentry if use_srcentry else srcname
try:
is_symlink = srcentry.is_symlink()
if is_symlink and os.name == 'nt':
# Special check for directory junctions, which appear as
# symlinks but we want to recurse.
# Not available on 3.6, use our impl instead
# lstat = srcentry.stat(follow_symlinks=False)
# if lstat.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT:
# is_symlink = False
from ubelt._win32_links import _win32_is_junction
if _win32_is_junction(srcentry):
is_symlink = False
if is_symlink:
linkto = os.readlink(srcname)
if symlinks:
# We can't just leave it to `copy_function` because legacy
# code with a custom `copy_function` may rely on copytree
# doing the right thing.
os.symlink(linkto, dstname)
copystat(srcobj, dstname, follow_symlinks=not symlinks)
else:
# ignore dangling symlink if the flag is on
if not os.path.exists(linkto) and ignore_dangling_symlinks:
continue
# otherwise let the copy occur. copy2 will raise an error
if srcentry.is_dir():
_compat_copytree(srcobj, dstname, symlinks, ignore,
copy_function,
dirs_exist_ok=dirs_exist_ok)
else:
copy_function(srcobj, dstname)
elif srcentry.is_dir():
_compat_copytree(srcobj, dstname, symlinks, ignore,
copy_function,
dirs_exist_ok=dirs_exist_ok)
else:
# Will raise a SpecialFileError for unsupported file types
copy_function(srcobj, dstname)
# catch the Error from the recursive copytree so that we can
# continue with other files
except Error as err:
errors.extend(err.args[0])
except OSError as why:
errors.append((srcname, dstname, str(why)))
try:
copystat(src, dst)
except OSError as why:
# Copying file access times may fail on Windows
if getattr(why, 'winerror', None) is None:
errors.append((src, dst, str(why)))
if errors:
raise Error(errors)
return dst