• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1"""Utility functions for copying and archiving files and directory trees.
2
3XXX The functions here don't copy the resource fork or other metadata on Mac.
4
5"""
6
7import os
8import sys
9import stat
10import fnmatch
11import collections
12import errno
13
14try:
15    import zlib
16    del zlib
17    _ZLIB_SUPPORTED = True
18except ImportError:
19    _ZLIB_SUPPORTED = False
20
21try:
22    import bz2
23    del bz2
24    _BZ2_SUPPORTED = True
25except ImportError:
26    _BZ2_SUPPORTED = False
27
28try:
29    import lzma
30    del lzma
31    _LZMA_SUPPORTED = True
32except ImportError:
33    _LZMA_SUPPORTED = False
34
35try:
36    from pwd import getpwnam
37except ImportError:
38    getpwnam = None
39
40try:
41    from grp import getgrnam
42except ImportError:
43    getgrnam = None
44
# Platform detection. `posix` and `nt` are bound to None first so that the
# names always exist; only the one matching the running platform is imported.
_WINDOWS = os.name == 'nt'
posix = nt = None
if os.name == 'posix':
    import posix
elif _WINDOWS:
    import nt

# Default chunk size for buffered copies: 1 MiB on Windows, 64 KiB elsewhere.
COPY_BUFSIZE = 1024 * 1024 if _WINDOWS else 64 * 1024
# True when os.sendfile() exists and we are running on Linux.
# _fastcopy_sendfile() may flip this to False at runtime.
_USE_CP_SENDFILE = hasattr(os, "sendfile") and sys.platform.startswith("linux")
# Truthy only when the posix module exposes _fcopyfile (None/False otherwise).
_HAS_FCOPYFILE = posix and hasattr(posix, "_fcopyfile")  # macOS

# CMD defaults in Windows 10
_WIN_DEFAULT_PATHEXT = ".COM;.EXE;.BAT;.CMD;.VBS;.JS;.WS;.MSC"

# Names exported by "from <this module> import *".
__all__ = ["copyfileobj", "copyfile", "copymode", "copystat", "copy", "copy2",
           "copytree", "move", "rmtree", "Error", "SpecialFileError",
           "ExecError", "make_archive", "get_archive_formats",
           "register_archive_format", "unregister_archive_format",
           "get_unpack_formats", "register_unpack_format",
           "unregister_unpack_format", "unpack_archive",
           "ignore_patterns", "chown", "which", "get_terminal_size",
           "SameFileError"]
           # disk_usage is added later, if available on the platform
68
class Error(OSError):
    """Generic error raised by the copy/move helpers in this module.

    copytree() raises it with a list of (src, dst, reason) tuples as its
    single argument; move() raises it with a plain message.
    """
71
class SameFileError(Error):
    """Signals that the source and the destination refer to the same file."""
74
class SpecialFileError(OSError):
    """Signals an operation (such as copying) that is not supported on a
    special file, for example a named pipe."""
78
class ExecError(OSError):
    """Signals that a command could not be executed."""
81
class ReadError(OSError):
    """Signals that an archive cannot be read."""
84
class RegistryError(Exception):
    """Signals a failed operation on the archiving or unpacking
    format registries."""
88
89class _GiveupOnFastCopy(Exception):
90    """Raised as a signal to fallback on using raw read()/write()
91    file copy when fast-copy functions fail to do so.
92    """
93
def _fastcopy_fcopyfile(fsrc, fdst, flags):
    """Copy the content or metadata of a regular file through the
    high-performance fcopyfile(3) syscall (macOS).

    *fsrc* and *fdst* are open file objects; *flags* is handed to
    posix._fcopyfile() unchanged.  Raises _GiveupOnFastCopy when the
    caller should fall back to a slower copy, and re-raises any other
    OSError with filename/filename2 filled in.
    """
    try:
        src_fd = fsrc.fileno()
        dst_fd = fdst.fileno()
    except Exception as exc:
        raise _GiveupOnFastCopy(exc)  # not a regular file

    try:
        posix._fcopyfile(src_fd, dst_fd, flags)
    except OSError as exc:
        # Attach both names so the error is informative for the caller.
        exc.filename = fsrc.name
        exc.filename2 = fdst.name
        if exc.errno not in {errno.EINVAL, errno.ENOTSUP}:
            raise exc from None
        raise _GiveupOnFastCopy(exc)
113
def _fastcopy_sendfile(fsrc, fdst):
    """Copy data from one regular mmap-like fd to another by using
    high-performance sendfile(2) syscall.
    This should work on Linux >= 2.6.33 only.

    *fsrc* and *fdst* are open file objects that expose fileno() and a
    `name` attribute.  Raises _GiveupOnFastCopy when the caller should
    fall back to a regular copy (no usable file descriptor, sendfile()
    not usable between regular files, or a failure before any data was
    written).  Any other OSError is re-raised with filename/filename2 set.
    """
    # Note: copyfileobj() is left alone in order to not introduce any
    # unexpected breakage. Possible risks by using zero-copy calls
    # in copyfileobj() are:
    # - fdst cannot be open in "a"(ppend) mode
    # - fsrc and fdst may be open in "t"(ext) mode
    # - fsrc may be a BufferedReader (which hides unread data in a buffer),
    #   GzipFile (which decompresses data), HTTPResponse (which decodes
    #   chunks).
    # - possibly others (e.g. encrypted fs/partition?)
    global _USE_CP_SENDFILE
    try:
        infd = fsrc.fileno()
        outfd = fdst.fileno()
    except Exception as err:
        raise _GiveupOnFastCopy(err)  # not a regular file

    # Hopefully the whole file will be copied in a single call.
    # sendfile() is called in a loop 'till EOF is reached (0 return)
    # so a bufsize smaller or bigger than the actual file size
    # should not make any difference, also in case the file content
    # changes while being copied.
    try:
        blocksize = max(os.fstat(infd).st_size, 2 ** 23)  # min 8MiB
    except OSError:
        blocksize = 2 ** 27  # 128MiB
    # On 32-bit architectures truncate to 1GiB to avoid OverflowError,
    # see bpo-38319.
    if sys.maxsize < 2 ** 32:
        blocksize = min(blocksize, 2 ** 30)

    offset = 0
    while True:
        try:
            sent = os.sendfile(outfd, infd, offset, blocksize)
        except OSError as err:
            # ...in order to have a more informative exception.
            err.filename = fsrc.name
            err.filename2 = fdst.name

            if err.errno == errno.ENOTSOCK:
                # sendfile() on this platform (probably Linux < 2.6.33)
                # does not support copies between regular files (only
                # sockets).  Disable the fast path for later calls too.
                _USE_CP_SENDFILE = False
                raise _GiveupOnFastCopy(err)

            if err.errno == errno.ENOSPC:  # filesystem is full
                raise err from None

            # Give up on first call and if no data was copied.
            if offset == 0 and os.lseek(outfd, 0, os.SEEK_CUR) == 0:
                raise _GiveupOnFastCopy(err)

            # Some data was already written: falling back is not safe,
            # so propagate the error.
            raise err
        else:
            if sent == 0:
                break  # EOF
            offset += sent
177
def _copyfileobj_readinto(fsrc, fdst, length=COPY_BUFSIZE):
    """Variant of copyfileobj() built on readinto() and a memoryview.

    *fsrc* must provide a readinto() method and both files must be open
    in binary mode.  *length* is the size of the reusable buffer.
    """
    # Bind the bound methods once; the loop below is hot.
    read_into = fsrc.readinto
    write = fdst.write
    with memoryview(bytearray(length)) as view:
        while chunk_len := read_into(view):
            if chunk_len < length:
                # Short read: only write the part that was filled.
                with view[:chunk_len] as partial:
                    write(partial)
            else:
                write(view)
196
def copyfileobj(fsrc, fdst, length=0):
    """Copy data from file-like object fsrc to file-like object fdst.

    Data is moved in chunks of *length*; a falsy *length* selects
    COPY_BUFSIZE.  Copying stops at the first empty read.
    """
    chunk_size = length if length else COPY_BUFSIZE
    # Bind the bound methods once to keep the loop cheap.
    read = fsrc.read
    write = fdst.write
    while chunk := read(chunk_size):
        write(chunk)
209
210def _samefile(src, dst):
211    # Macintosh, Unix.
212    if isinstance(src, os.DirEntry) and hasattr(os.path, 'samestat'):
213        try:
214            return os.path.samestat(src.stat(), os.stat(dst))
215        except OSError:
216            return False
217
218    if hasattr(os.path, 'samefile'):
219        try:
220            return os.path.samefile(src, dst)
221        except OSError:
222            return False
223
224    # All other platforms: check for same pathname.
225    return (os.path.normcase(os.path.abspath(src)) ==
226            os.path.normcase(os.path.abspath(dst)))
227
228def _stat(fn):
229    return fn.stat() if isinstance(fn, os.DirEntry) else os.stat(fn)
230
231def _islink(fn):
232    return fn.is_symlink() if isinstance(fn, os.DirEntry) else os.path.islink(fn)
233
def copyfile(src, dst, *, follow_symlinks=True):
    """Copy data from src to dst in the most efficient way possible.

    When follow_symlinks is false and src is a symbolic link, dst is
    created as a new symlink rather than as a copy of the link target.

    Raises SameFileError if src and dst are the same file and
    SpecialFileError if either one is a named pipe.  Returns dst.
    """
    sys.audit("shutil.copyfile", src, dst)

    if _samefile(src, dst):
        raise SameFileError("{!r} and {!r} are the same file".format(src, dst))

    src_size = 0
    for index, candidate in enumerate([src, dst]):
        try:
            info = _stat(candidate)
        except OSError:
            # File most likely does not exist
            continue
        # XXX What about other special files? (sockets, devices...)
        if stat.S_ISFIFO(info.st_mode):
            if isinstance(candidate, os.DirEntry):
                candidate = candidate.path
            raise SpecialFileError("`%s` is a named pipe" % candidate)
        if _WINDOWS and index == 0:
            # Only the source size matters; it sizes the Windows buffer.
            src_size = info.st_size

    if not follow_symlinks and _islink(src):
        os.symlink(os.readlink(src), dst)
        return dst

    with open(src, 'rb') as fsrc, open(dst, 'wb') as fdst:
        if _HAS_FCOPYFILE:
            # macOS
            try:
                _fastcopy_fcopyfile(fsrc, fdst, posix._COPYFILE_DATA)
            except _GiveupOnFastCopy:
                pass
            else:
                return dst
        elif _USE_CP_SENDFILE:
            # Linux
            try:
                _fastcopy_sendfile(fsrc, fdst)
            except _GiveupOnFastCopy:
                pass
            else:
                return dst
        elif _WINDOWS and src_size > 0:
            # Windows, see:
            # https://github.com/python/cpython/pull/7160#discussion_r195405230
            _copyfileobj_readinto(fsrc, fdst, min(src_size, COPY_BUFSIZE))
            return dst

        # Generic fallback, also used when a fast path gave up.
        copyfileobj(fsrc, fdst)

    return dst
288
def copymode(src, dst, *, follow_symlinks=True):
    """Copy mode bits from src to dst.

    When follow_symlinks is false and both `src` and `dst` are symlinks,
    the links themselves are used: the mode is read with lstat() and
    applied with lchmod().  If `lchmod` isn't available in that case
    (e.g. Linux) nothing is done.  In every other situation symlinks
    are followed.
    """
    sys.audit("shutil.copymode", src, dst)

    operate_on_links = (not follow_symlinks and _islink(src)
                        and os.path.islink(dst))
    if operate_on_links:
        if not hasattr(os, 'lchmod'):
            return
        read_stat, apply_mode = os.lstat, os.lchmod
    else:
        read_stat, apply_mode = _stat, os.chmod

    source_info = read_stat(src)
    apply_mode(dst, stat.S_IMODE(source_info.st_mode))
309
310if hasattr(os, 'listxattr'):
311    def _copyxattr(src, dst, *, follow_symlinks=True):
312        """Copy extended filesystem attributes from `src` to `dst`.
313
314        Overwrite existing attributes.
315
316        If `follow_symlinks` is false, symlinks won't be followed.
317
318        """
319
320        try:
321            names = os.listxattr(src, follow_symlinks=follow_symlinks)
322        except OSError as e:
323            if e.errno not in (errno.ENOTSUP, errno.ENODATA, errno.EINVAL):
324                raise
325            return
326        for name in names:
327            try:
328                value = os.getxattr(src, name, follow_symlinks=follow_symlinks)
329                os.setxattr(dst, name, value, follow_symlinks=follow_symlinks)
330            except OSError as e:
331                if e.errno not in (errno.EPERM, errno.ENOTSUP, errno.ENODATA,
332                                   errno.EINVAL):
333                    raise
334else:
335    def _copyxattr(*args, **kwargs):
336        pass
337
def copystat(src, dst, *, follow_symlinks=True):
    """Copy file metadata

    Copy the permission bits, last access time, last modification time, and
    flags from `src` to `dst`. On Linux, copystat() also copies the "extended
    attributes" where possible. The file contents, owner, and group are
    unaffected. `src` and `dst` are path-like objects or path names given as
    strings.

    If the optional flag `follow_symlinks` is not set, symlinks aren't
    followed if and only if both `src` and `dst` are symlinks.
    """
    sys.audit("shutil.copystat", src, dst)

    # Stand-in for an os function that is missing or unusable here; it
    # accepts the same call shapes used below and does nothing.
    def _nop(*args, ns=None, follow_symlinks=None):
        pass

    # Follow symlinks unless the caller asked not to AND both src and dst
    # are symlinks.
    follow = follow_symlinks or not (_islink(src) and os.path.islink(dst))
    if follow:
        # use the real function if it exists
        def lookup(name):
            return getattr(os, name, _nop)
    else:
        # use the real function only if it exists
        # *and* it supports follow_symlinks
        def lookup(name):
            fn = getattr(os, name, _nop)
            if fn in os.supports_follow_symlinks:
                return fn
            return _nop

    if isinstance(src, os.DirEntry):
        st = src.stat(follow_symlinks=follow)
    else:
        st = lookup("stat")(src, follow_symlinks=follow)
    mode = stat.S_IMODE(st.st_mode)
    lookup("utime")(dst, ns=(st.st_atime_ns, st.st_mtime_ns),
        follow_symlinks=follow)
    # We must copy extended attributes before the file is (potentially)
    # chmod()'ed read-only, otherwise setxattr() will error with -EACCES.
    _copyxattr(src, dst, follow_symlinks=follow)
    try:
        lookup("chmod")(dst, mode, follow_symlinks=follow)
    except NotImplementedError:
        # chmod() raised NotImplementedError.  Presumably this happens when
        # follow_symlinks=False and the platform has no way to change the
        # mode of the symlink itself (see the os.chmod documentation).
        # We are out of options--we simply cannot chmod the symlink.
        # Give up and suppress the error.
        # (which is what shutil always did in this circumstance.)
        # NOTE(review): an earlier wording of this comment mentioned
        # lchown()/fchownat(); the call guarded here is chmod.
        pass
    if hasattr(st, 'st_flags'):
        try:
            lookup("chflags")(dst, st.st_flags, follow_symlinks=follow)
        except OSError as why:
            # Ignore "operation not supported" (under whichever errno names
            # exist on this platform); re-raise everything else.
            for err in 'EOPNOTSUPP', 'ENOTSUP':
                if hasattr(errno, err) and why.errno == getattr(errno, err):
                    break
            else:
                raise
403
def copy(src, dst, *, follow_symlinks=True):
    """Copy data and mode bits ("cp src dst"). Return the file's destination.

    dst may name a directory, in which case the file is copied into it
    under the base name of src.

    With follow_symlinks false, symlinks are not followed, which
    resembles GNU's "cp -P src dst".

    A SameFileError is raised when source and destination are the same
    file.

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target, follow_symlinks=follow_symlinks)
    copymode(src, target, follow_symlinks=follow_symlinks)
    return target
421
def copy2(src, dst, *, follow_symlinks=True):
    """Copy data and metadata. Return the file's destination.

    The metadata is transferred by copystat(); see that function for
    what exactly is copied.

    dst may name a directory, in which case the file is copied into it
    under the base name of src.

    With follow_symlinks false, symlinks are not followed, which
    resembles GNU's "cp -P src dst".
    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target, follow_symlinks=follow_symlinks)
    copystat(src, target, follow_symlinks=follow_symlinks)
    return target
438
def ignore_patterns(*patterns):
    """Build a callable suitable for copytree()'s ignore parameter.

    *patterns* are glob-style patterns; the returned callable reports
    the set of names matching at least one of them."""
    def _ignore_patterns(path, names):
        matched = set()
        for glob in patterns:
            matched.update(fnmatch.filter(names, glob))
        return matched
    return _ignore_patterns
450
def _copytree(entries, src, dst, symlinks, ignore, copy_function,
              ignore_dangling_symlinks, dirs_exist_ok=False):
    """Copy the pre-listed *entries* of directory *src* into *dst*.

    entries: os.DirEntry objects obtained from scanning *src*.
    symlinks: if true, symlinks are recreated as symlinks; otherwise the
        link targets are copied.
    ignore: optional callable(src, names) returning the names to skip.
    copy_function: callable(src, dst) used for every non-directory entry.
    ignore_dangling_symlinks: if true (and *symlinks* is false), symlinks
        whose target does not exist are silently skipped.  The flag is
        forwarded to every sub-directory.
    dirs_exist_ok: passed to os.makedirs() as exist_ok for *dst*.

    Returns *dst*.  Failures are collected as (src, dst, reason) tuples
    and raised together in a single Error after the whole directory has
    been processed.
    """
    if ignore is not None:
        ignored_names = ignore(os.fspath(src), [x.name for x in entries])
    else:
        ignored_names = set()

    os.makedirs(dst, exist_ok=dirs_exist_ok)
    errors = []
    # The stock copy functions accept a DirEntry, which saves stat calls;
    # custom copy functions get a plain path.
    use_srcentry = copy_function is copy2 or copy_function is copy

    for srcentry in entries:
        if srcentry.name in ignored_names:
            continue
        srcname = os.path.join(src, srcentry.name)
        dstname = os.path.join(dst, srcentry.name)
        srcobj = srcentry if use_srcentry else srcname
        try:
            is_symlink = srcentry.is_symlink()
            if is_symlink and os.name == 'nt':
                # Special check for directory junctions, which appear as
                # symlinks but we want to recurse.
                lstat = srcentry.stat(follow_symlinks=False)
                if lstat.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT:
                    is_symlink = False
            if is_symlink:
                linkto = os.readlink(srcname)
                if symlinks:
                    # We can't just leave it to `copy_function` because legacy
                    # code with a custom `copy_function` may rely on copytree
                    # doing the right thing.
                    os.symlink(linkto, dstname)
                    copystat(srcobj, dstname, follow_symlinks=not symlinks)
                else:
                    # ignore dangling symlink if the flag is on.
                    # Test the link itself rather than `linkto`: a relative
                    # target must be resolved against the link's directory,
                    # not the current working directory, and
                    # os.path.exists() is false for broken symlinks.
                    if ignore_dangling_symlinks and not os.path.exists(srcname):
                        continue
                    # otherwise let the copy occur. copy2 will raise an error
                    if srcentry.is_dir():
                        copytree(srcobj, dstname, symlinks, ignore,
                                 copy_function,
                                 ignore_dangling_symlinks=ignore_dangling_symlinks,
                                 dirs_exist_ok=dirs_exist_ok)
                    else:
                        copy_function(srcobj, dstname)
            elif srcentry.is_dir():
                copytree(srcobj, dstname, symlinks, ignore, copy_function,
                         ignore_dangling_symlinks=ignore_dangling_symlinks,
                         dirs_exist_ok=dirs_exist_ok)
            else:
                # Will raise a SpecialFileError for unsupported file types
                copy_function(srcobj, dstname)
        # catch the Error from the recursive copytree so that we can
        # continue with other files
        except Error as err:
            errors.extend(err.args[0])
        except OSError as why:
            errors.append((srcname, dstname, str(why)))
    try:
        copystat(src, dst)
    except OSError as why:
        # Copying file access times may fail on Windows
        if getattr(why, 'winerror', None) is None:
            errors.append((src, dst, str(why)))
    if errors:
        raise Error(errors)
    return dst
515
def copytree(src, dst, symlinks=False, ignore=None, copy_function=copy2,
             ignore_dangling_symlinks=False, dirs_exist_ok=False):
    """Recursively copy a directory tree and return the destination directory.

    dirs_exist_ok controls whether an already existing dst (or
    sub-directory of it) is accepted instead of raising an exception.

    Problems met while copying are collected, and a single Error
    carrying the list of reasons is raised at the end.

    With a true symlinks flag, symbolic links in the source tree become
    symbolic links in the destination tree; with a false one, the
    contents of the files the links point to are copied.  When the file
    a symlink points to doesn't exist, an exception is added to the list
    of errors raised in the Error exception at the end of the copy
    process.

    Set the optional ignore_dangling_symlinks flag to true to silence
    that exception.  Note that it has no effect on platforms that don't
    support os.symlink.

    The optional ignore argument is a callable.  When given, it is
    called with `src`, the directory currently being visited by
    copytree(), and `names`, the list of the contents of `src`:

        callable(src, names) -> ignored_names

    Because copytree() is called recursively, the callable is invoked
    once per copied directory.  It returns the names, relative to the
    `src` directory, that must not be copied.

    The optional copy_function argument is a callable used to copy each
    file.  It is called with the source path and the destination path.
    copy2() is the default, but any function with the same signature
    (such as copy()) will do.

    """
    sys.audit("shutil.copytree", src, dst)
    # Materialise the listing so the scandir handle is closed before
    # any copying starts.
    with os.scandir(src) as scan:
        listing = list(scan)
    return _copytree(
        entries=listing,
        src=src,
        dst=dst,
        symlinks=symlinks,
        ignore=ignore,
        copy_function=copy_function,
        ignore_dangling_symlinks=ignore_dangling_symlinks,
        dirs_exist_ok=dirs_exist_ok,
    )
561
562if hasattr(os.stat_result, 'st_file_attributes'):
563    # Special handling for directory junctions to make them behave like
564    # symlinks for shutil.rmtree, since in general they do not appear as
565    # regular links.
566    def _rmtree_isdir(entry):
567        try:
568            st = entry.stat(follow_symlinks=False)
569            return (stat.S_ISDIR(st.st_mode) and not
570                (st.st_file_attributes & stat.FILE_ATTRIBUTE_REPARSE_POINT
571                 and st.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT))
572        except OSError:
573            return False
574
575    def _rmtree_islink(path):
576        try:
577            st = os.lstat(path)
578            return (stat.S_ISLNK(st.st_mode) or
579                (st.st_file_attributes & stat.FILE_ATTRIBUTE_REPARSE_POINT
580                 and st.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT))
581        except OSError:
582            return False
583else:
584    def _rmtree_isdir(entry):
585        try:
586            return entry.is_dir(follow_symlinks=False)
587        except OSError:
588            return False
589
590    def _rmtree_islink(path):
591        return os.path.islink(path)
592
593# version vulnerable to race conditions
def _rmtree_unsafe(path, onerror):
    """Remove the directory tree at *path* using path-based calls.

    Every failure is reported as onerror(func, path, exc_info) and the
    removal carries on with the remaining entries.
    """
    try:
        with os.scandir(path) as listing:
            children = list(listing)
    except OSError:
        onerror(os.scandir, path, sys.exc_info())
        children = []
    for child in children:
        child_path = child.path
        if not _rmtree_isdir(child):
            try:
                os.unlink(child_path)
            except OSError:
                onerror(os.unlink, child_path, sys.exc_info())
            continue
        try:
            if child.is_symlink():
                # This can only happen if someone replaces
                # a directory with a symlink after the call to
                # os.scandir or entry.is_dir above.
                raise OSError("Cannot call rmtree on a symbolic link")
        except OSError:
            onerror(os.path.islink, child_path, sys.exc_info())
            continue
        _rmtree_unsafe(child_path, onerror)
    try:
        os.rmdir(path)
    except OSError:
        onerror(os.rmdir, path, sys.exc_info())
623
624# Version using fd-based APIs to protect against races
def _rmtree_safe_fd(topfd, path, onerror):
    """Remove everything inside the directory open as *topfd*.

    topfd: file descriptor of the directory being emptied.
    path: path of that directory, used only to build the names passed
        to *onerror*.
    onerror: callable(func, path, exc_info) invoked for every failure.

    The directory itself is not removed here; the caller does that.
    """
    try:
        with os.scandir(topfd) as scandir_it:
            entries = list(scandir_it)
    except OSError as err:
        err.filename = path
        onerror(os.scandir, path, sys.exc_info())
        return
    for entry in entries:
        fullname = os.path.join(path, entry.name)
        try:
            is_dir = entry.is_dir(follow_symlinks=False)
        except OSError:
            is_dir = False
        else:
            if is_dir:
                # Keep the stat result: it is compared further down with
                # the fstat() of the descriptor we actually open.
                try:
                    orig_st = entry.stat(follow_symlinks=False)
                    is_dir = stat.S_ISDIR(orig_st.st_mode)
                except OSError:
                    onerror(os.lstat, fullname, sys.exc_info())
                    continue
        if is_dir:
            # orig_st is always bound here: is_dir can only be true after
            # the stat call above succeeded.
            try:
                dirfd = os.open(entry.name, os.O_RDONLY, dir_fd=topfd)
            except OSError:
                onerror(os.open, fullname, sys.exc_info())
            else:
                try:
                    # Recurse only if what we opened is the same object
                    # that was stat()'ed above.
                    if os.path.samestat(orig_st, os.fstat(dirfd)):
                        _rmtree_safe_fd(dirfd, fullname, onerror)
                        try:
                            os.rmdir(entry.name, dir_fd=topfd)
                        except OSError:
                            onerror(os.rmdir, fullname, sys.exc_info())
                    else:
                        try:
                            # This can only happen if someone replaces
                            # a directory with a symlink after the call to
                            # os.scandir or stat.S_ISDIR above.
                            raise OSError("Cannot call rmtree on a symbolic "
                                          "link")
                        except OSError:
                            onerror(os.path.islink, fullname, sys.exc_info())
                finally:
                    os.close(dirfd)
        else:
            try:
                os.unlink(entry.name, dir_fd=topfd)
            except OSError:
                onerror(os.unlink, fullname, sys.exc_info())
676
# True when the platform offers everything the fd-based rmtree needs:
# dir_fd support in open/stat/unlink/rmdir, scandir() on a file descriptor,
# and stat() with follow_symlinks.
_use_fd_functions = ({os.open, os.stat, os.unlink, os.rmdir} <=
                     os.supports_dir_fd and
                     os.scandir in os.supports_fd and
                     os.stat in os.supports_follow_symlinks)
681
def rmtree(path, ignore_errors=False, onerror=None):
    """Recursively delete a directory tree.

    If ignore_errors is set, errors are ignored; otherwise, if onerror
    is set, it is called to handle the error with arguments (func,
    path, exc_info) where func is platform and implementation dependent;
    path is the argument to that function that caused it to fail; and
    exc_info is a tuple returned by sys.exc_info().  If ignore_errors
    is false and onerror is None, an exception is raised.

    *path* must not be a symbolic link: that case is reported as an
    OSError through the error handling described above.
    """
    sys.audit("shutil.rmtree", path)
    if ignore_errors:
        def onerror(*args):
            pass
    elif onerror is None:
        # The bare raise re-raises the exception being handled; this works
        # because onerror is only ever called from inside an except block.
        def onerror(*args):
            raise
    if _use_fd_functions:
        # While the unsafe rmtree works fine on bytes, the fd based does not.
        if isinstance(path, bytes):
            path = os.fsdecode(path)
        # Note: To guard against symlink races, we use the standard
        # lstat()/open()/fstat() trick.
        try:
            orig_st = os.lstat(path)
        except Exception:
            onerror(os.lstat, path, sys.exc_info())
            return
        try:
            fd = os.open(path, os.O_RDONLY)
        except Exception:
            onerror(os.open, path, sys.exc_info())
            return
        try:
            # Proceed only if the opened descriptor is the object that was
            # lstat()'ed; a mismatch is reported as a symlink below.
            if os.path.samestat(orig_st, os.fstat(fd)):
                _rmtree_safe_fd(fd, path, onerror)
                try:
                    os.rmdir(path)
                except OSError:
                    onerror(os.rmdir, path, sys.exc_info())
            else:
                try:
                    # symlinks to directories are forbidden, see bug #1669
                    raise OSError("Cannot call rmtree on a symbolic link")
                except OSError:
                    onerror(os.path.islink, path, sys.exc_info())
        finally:
            os.close(fd)
    else:
        try:
            if _rmtree_islink(path):
                # symlinks to directories are forbidden, see bug #1669
                raise OSError("Cannot call rmtree on a symbolic link")
        except OSError:
            onerror(os.path.islink, path, sys.exc_info())
            # can't continue even if onerror hook returns
            return
        return _rmtree_unsafe(path, onerror)

# Allow introspection of whether or not the hardening against symlink
# attacks is supported on the current platform
rmtree.avoids_symlink_attacks = _use_fd_functions
745
746def _basename(path):
747    """A basename() variant which first strips the trailing slash, if present.
748    Thus we always get the last component of the path, even for directories.
749
750    path: Union[PathLike, str]
751
752    e.g.
753    >>> os.path.basename('/bar/foo')
754    'foo'
755    >>> os.path.basename('/bar/foo/')
756    ''
757    >>> _basename('/bar/foo/')
758    'foo'
759    """
760    path = os.fspath(path)
761    sep = os.path.sep + (os.path.altsep or '')
762    return os.path.basename(path.rstrip(sep))
763
def move(src, dst, copy_function=copy2):
    """Recursively move a file or directory to another location. This is
    similar to the Unix "mv" command. Return the file or directory's
    destination.

    If the destination is a directory or a symlink to a directory, the source
    is moved inside the directory. The destination path must not already
    exist.

    If the destination already exists but is not a directory, it may be
    overwritten depending on os.rename() semantics.

    If the destination is on our current filesystem, then rename() is used.
    Otherwise, src is copied to the destination and then removed. Symlinks are
    recreated under the new name if os.rename() fails because of cross
    filesystem renames.

    The optional `copy_function` argument is a callable that will be used
    to copy the source or it will be delegated to `copytree`.
    By default, copy2() is used, but any function that supports the same
    signature (like copy()) can be used.

    Raises Error if the computed destination already exists inside the
    destination directory, or if a directory would be moved into itself.

    A lot more could be done here...  A look at a mv.c shows a lot of
    the issues this implementation glosses over.

    """
    sys.audit("shutil.move", src, dst)
    real_dst = dst
    if os.path.isdir(dst):
        if _samefile(src, dst):
            # We might be on a case insensitive filesystem,
            # perform the rename anyway.
            os.rename(src, dst)
            # Return the destination here as on every other path (this
            # branch used to return None).
            return real_dst

        # Using _basename instead of os.path.basename is important, as we must
        # ignore any trailing slash to avoid the basename returning ''
        real_dst = os.path.join(dst, _basename(src))

        if os.path.exists(real_dst):
            raise Error("Destination path '%s' already exists" % real_dst)
    try:
        os.rename(src, real_dst)
    except OSError:
        # rename() failed: fall back to copy-then-delete.
        if os.path.islink(src):
            linkto = os.readlink(src)
            os.symlink(linkto, real_dst)
            os.unlink(src)
        elif os.path.isdir(src):
            if _destinsrc(src, dst):
                raise Error("Cannot move a directory '%s' into itself"
                            " '%s'." % (src, dst))
            copytree(src, real_dst, copy_function=copy_function,
                     symlinks=True)
            rmtree(src)
        else:
            copy_function(src, real_dst)
            os.unlink(src)
    return real_dst
823
824def _destinsrc(src, dst):
825    src = os.path.abspath(src)
826    dst = os.path.abspath(dst)
827    if not src.endswith(os.path.sep):
828        src += os.path.sep
829    if not dst.endswith(os.path.sep):
830        dst += os.path.sep
831    return dst.startswith(src)
832
833def _get_gid(name):
834    """Returns a gid, given a group name."""
835    if getgrnam is None or name is None:
836        return None
837    try:
838        result = getgrnam(name)
839    except KeyError:
840        result = None
841    if result is not None:
842        return result[2]
843    return None
844
845def _get_uid(name):
846    """Returns an uid, given a user name."""
847    if getpwnam is None or name is None:
848        return None
849    try:
850        result = getpwnam(name)
851    except KeyError:
852        result = None
853    if result is not None:
854        return result[2]
855    return None
856
def _make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
                  owner=None, group=None, logger=None):
    """Build a (possibly compressed) tar archive of everything under
    'base_dir'.

    'compress' selects the compression: "gzip" (the default), "bzip2", "xz",
    or None for a plain tar file.  ValueError is raised for any other value,
    or when the matching compression module could not be imported.

    'owner' and 'group' name the user and group recorded for every archive
    member.  A name that cannot be resolved to an id is ignored, leaving the
    member's own ownership information untouched.

    The archive is written to 'base_name' + ".tar" plus the compression
    extension (".gz", ".bz2", or ".xz"); a missing parent directory is
    created first.  When 'dry_run' is true nothing is created on disk.
    'verbose' is accepted but not used.

    Returns the output filename.
    """
    if compress is None:
        tar_compression = ''
    else:
        # (value of 'compress', tarfile mode suffix, module available?)
        known = (('gzip', 'gz', _ZLIB_SUPPORTED),
                 ('bzip2', 'bz2', _BZ2_SUPPORTED),
                 ('xz', 'xz', _LZMA_SUPPORTED))
        for label, suffix, available in known:
            if available and compress == label:
                tar_compression = suffix
                break
        else:
            raise ValueError("bad value for 'compress', or compression format not "
                             "supported : {0}".format(compress))

    import tarfile  # late import for breaking circular dependency

    compress_ext = ('.' + tar_compression) if compress else ''
    archive_name = base_name + '.tar' + compress_ext
    archive_dir = os.path.dirname(archive_name)

    if archive_dir and not os.path.exists(archive_dir):
        if logger is not None:
            logger.info("creating %s", archive_dir)
        if not dry_run:
            os.makedirs(archive_dir)

    if logger is not None:
        logger.info('Creating tar archive')

    uid = _get_uid(owner)
    gid = _get_gid(group)

    def _apply_ownership(tarinfo):
        # Override ownership only for the ids that could be resolved.
        if gid is not None:
            tarinfo.gid = gid
            tarinfo.gname = group
        if uid is not None:
            tarinfo.uid = uid
            tarinfo.uname = owner
        return tarinfo

    if dry_run:
        return archive_name

    archive = tarfile.open(archive_name, 'w|%s' % tar_compression)
    try:
        archive.add(base_dir, filter=_apply_ownership)
    finally:
        # close() is called explicitly so the archive is finalised even
        # when adding a member fails.
        archive.close()

    return archive_name
921
922def _make_zipfile(base_name, base_dir, verbose=0, dry_run=0, logger=None):
923    """Create a zip file from all the files under 'base_dir'.
924
925    The output zip file will be named 'base_name' + ".zip".  Returns the
926    name of the output zip file.
927    """
928    import zipfile  # late import for breaking circular dependency
929
930    zip_filename = base_name + ".zip"
931    archive_dir = os.path.dirname(base_name)
932
933    if archive_dir and not os.path.exists(archive_dir):
934        if logger is not None:
935            logger.info("creating %s", archive_dir)
936        if not dry_run:
937            os.makedirs(archive_dir)
938
939    if logger is not None:
940        logger.info("creating '%s' and adding '%s' to it",
941                    zip_filename, base_dir)
942
943    if not dry_run:
944        with zipfile.ZipFile(zip_filename, "w",
945                             compression=zipfile.ZIP_DEFLATED) as zf:
946            path = os.path.normpath(base_dir)
947            if path != os.curdir:
948                zf.write(path, path)
949                if logger is not None:
950                    logger.info("adding '%s'", path)
951            for dirpath, dirnames, filenames in os.walk(base_dir):
952                for name in sorted(dirnames):
953                    path = os.path.normpath(os.path.join(dirpath, name))
954                    zf.write(path, path)
955                    if logger is not None:
956                        logger.info("adding '%s'", path)
957                for name in filenames:
958                    path = os.path.normpath(os.path.join(dirpath, name))
959                    if os.path.isfile(path):
960                        zf.write(path, path)
961                        if logger is not None:
962                            logger.info("adding '%s'", path)
963
964    return zip_filename
965
# Registry of archive creators, keyed by format name.  Each value is a
# (function, extra_args, description) tuple; extra_args is a list of
# (keyword, value) pairs passed on to the function.
_ARCHIVE_FORMATS = {
    'tar':   (_make_tarball, [('compress', None)], "uncompressed tar file"),
}

# Formats below are registered only when their compression module imported.
if _ZLIB_SUPPORTED:
    _ARCHIVE_FORMATS.update({
        'gztar': (_make_tarball, [('compress', 'gzip')], "gzip'ed tar-file"),
        'zip': (_make_zipfile, [], "ZIP file"),
    })

if _BZ2_SUPPORTED:
    _ARCHIVE_FORMATS.update({
        'bztar': (_make_tarball, [('compress', 'bzip2')], "bzip2'ed tar-file"),
    })

if _LZMA_SUPPORTED:
    _ARCHIVE_FORMATS.update({
        'xztar': (_make_tarball, [('compress', 'xz')], "xz'ed tar-file"),
    })
982
def get_archive_formats():
    """Returns a list of the formats currently registered for archiving.

    Each element of the returned list is a tuple (name, description); the
    list is sorted.
    """
    return sorted((name, registry[2])
                  for name, registry in _ARCHIVE_FORMATS.items())
992
def register_archive_format(name, function, extra_args=None, description=''):
    """Registers an archive format.

    name is the name of the format. function is the callable that will be
    used to create archives. If provided, extra_args is a sequence of
    (name, value) tuples that will be passed as arguments to the callable.
    description can be provided to describe the format, and will be returned
    by the get_archive_formats() function.

    Raises TypeError if function is not callable, if extra_args is not a
    tuple or list, or if one of its elements is not a 2-item tuple or list.
    An existing registration under the same name is replaced.
    """
    if extra_args is None:
        extra_args = []
    if not callable(function):
        # Wrap the operand in a 1-tuple: a bare tuple operand would be
        # unpacked by '%' and produce a formatting error (or a misleading
        # message) instead of the intended one.
        raise TypeError('The %s object is not callable' % (function,))
    if not isinstance(extra_args, (tuple, list)):
        raise TypeError('extra_args needs to be a sequence')
    for element in extra_args:
        if not isinstance(element, (tuple, list)) or len(element) != 2:
            raise TypeError('extra_args elements are : (arg_name, value)')

    _ARCHIVE_FORMATS[name] = (function, extra_args, description)
1013
def unregister_archive_format(name):
    """Removes the archive format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _ARCHIVE_FORMATS.pop(name)
1016
def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
                 dry_run=0, owner=None, group=None, logger=None):
    """Create an archive file (eg. zip or tar).

    'base_name' is the name of the file to create, minus any format-specific
    extension; 'format' is the archive format: one of "zip", "tar", "gztar",
    "bztar", or "xztar".  Or any other registered format.

    'root_dir' is a directory that will be the root directory of the
    archive; ie. we typically chdir into 'root_dir' before creating the
    archive.  'base_dir' is the directory where we start archiving from;
    ie. 'base_dir' will be the common prefix of all files and
    directories in the archive.  'root_dir' and 'base_dir' both default
    to the current directory.  Returns the name of the archive file.

    'owner' and 'group' are passed to the archiver for every format except
    "zip".  By default, uses the current owner and group.

    'dry_run' and 'logger' are forwarded to the archiver; 'verbose' is
    accepted but not used.

    Raises ValueError if 'format' is not a registered archive format.  The
    working directory is left untouched in that case.
    """
    sys.audit("shutil.make_archive", base_name, format, root_dir, base_dir)

    # Resolve the format and assemble the archiver arguments *before*
    # touching the working directory: a failure here must not leave the
    # process stranded in 'root_dir'.
    try:
        format_info = _ARCHIVE_FORMATS[format]
    except KeyError:
        raise ValueError("unknown archive format '%s'" % format) from None

    func = format_info[0]
    kwargs = {'dry_run': dry_run, 'logger': logger}
    for arg, val in format_info[1]:
        kwargs[arg] = val

    if format != 'zip':
        kwargs['owner'] = owner
        kwargs['group'] = group

    if base_dir is None:
        base_dir = os.curdir

    # The current directory is only queried when it will have to be
    # restored, so archiving without 'root_dir' does not depend on it.
    save_cwd = None
    if root_dir is not None:
        save_cwd = os.getcwd()
        if logger is not None:
            logger.debug("changing into '%s'", root_dir)
        # Make the target absolute so it is unaffected by the chdir below.
        base_name = os.path.abspath(base_name)
        if not dry_run:
            os.chdir(root_dir)

    try:
        filename = func(base_name, base_dir, **kwargs)
    finally:
        if save_cwd is not None:
            if logger is not None:
                logger.debug("changing back to '%s'", save_cwd)
            os.chdir(save_cwd)

    return filename
1071
1072
def get_unpack_formats():
    """Returns a list of the formats currently registered for unpacking.

    Each element of the returned list is a tuple
    (name, extensions, description); the list is sorted.
    """
    return sorted((name, info[0], info[3])
                  for name, info in _UNPACK_FORMATS.items())
1083
1084def _check_unpack_options(extensions, function, extra_args):
1085    """Checks what gets registered as an unpacker."""
1086    # first make sure no other unpacker is registered for this extension
1087    existing_extensions = {}
1088    for name, info in _UNPACK_FORMATS.items():
1089        for ext in info[0]:
1090            existing_extensions[ext] = name
1091
1092    for extension in extensions:
1093        if extension in existing_extensions:
1094            msg = '%s is already registered for "%s"'
1095            raise RegistryError(msg % (extension,
1096                                       existing_extensions[extension]))
1097
1098    if not callable(function):
1099        raise TypeError('The registered function must be a callable')
1100
1101
def register_unpack_format(name, extensions, function, extra_args=None,
                           description=''):
    """Registers an unpack format.

    `name` is the name of the format. `extensions` is a list of extensions
    corresponding to the format.

    `function` is the callable that will be used to unpack archives. The
    callable will receive archives to unpack. If it's unable to handle an
    archive, it needs to raise a ReadError exception.

    If provided, `extra_args` is a sequence of (name, value) tuples that
    will be passed as arguments to the callable. `description` can be
    provided to describe the format, and will be returned by the
    get_unpack_formats() function.

    The arguments are validated by _check_unpack_options() before the
    format is stored.
    """
    extra_args = [] if extra_args is None else extra_args
    _check_unpack_options(extensions, function, extra_args)
    _UNPACK_FORMATS[name] = (extensions, function, extra_args, description)
1123
def unregister_unpack_format(name):
    """Removes the unpack format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _UNPACK_FORMATS.pop(name)
1127
1128def _ensure_directory(path):
1129    """Ensure that the parent directory of `path` exists"""
1130    dirname = os.path.dirname(path)
1131    if not os.path.isdir(dirname):
1132        os.makedirs(dirname)
1133
def _unpack_zipfile(filename, extract_dir):
    """Unpack zip `filename` to `extract_dir`.

    Raises ReadError if `filename` is not a zip file.  Members whose name
    starts with '/' or contains '..' are skipped.  Each extracted file is
    read into memory in full before being written out.
    """
    import zipfile  # late import for breaking circular dependency

    if not zipfile.is_zipfile(filename):
        raise ReadError("%s is not a zip file" % filename)

    with zipfile.ZipFile(filename) as archive:
        for member in archive.infolist():
            member_name = member.filename

            # don't extract absolute paths or ones with .. in them
            if member_name.startswith('/') or '..' in member_name:
                continue

            target = os.path.join(extract_dir, *member_name.split('/'))
            if not target:
                continue

            _ensure_directory(target)
            if member_name.endswith('/'):
                # A directory entry: creating it above was all there is to do.
                continue

            payload = archive.read(member.filename)
            with open(target, 'wb') as out:
                out.write(payload)
1167
1168def _unpack_tarfile(filename, extract_dir):
1169    """Unpack tar/tar.gz/tar.bz2/tar.xz `filename` to `extract_dir`
1170    """
1171    import tarfile  # late import for breaking circular dependency
1172    try:
1173        tarobj = tarfile.open(filename)
1174    except tarfile.TarError:
1175        raise ReadError(
1176            "%s is not a compressed or uncompressed tar file" % filename)
1177    try:
1178        tarobj.extractall(extract_dir)
1179    finally:
1180        tarobj.close()
1181
# Registry of unpackers, keyed by format name.  Each value is an
# (extensions, function, extra_args, description) tuple.
_UNPACK_FORMATS = {
    'tar':   (['.tar'], _unpack_tarfile, [], "uncompressed tar file"),
    'zip':   (['.zip'], _unpack_zipfile, [], "ZIP file"),
}

# Formats below are registered only when their compression module imported.
if _ZLIB_SUPPORTED:
    _UNPACK_FORMATS.update({
        'gztar': (['.tar.gz', '.tgz'], _unpack_tarfile, [],
                  "gzip'ed tar-file"),
    })

if _BZ2_SUPPORTED:
    _UNPACK_FORMATS.update({
        'bztar': (['.tar.bz2', '.tbz2'], _unpack_tarfile, [],
                  "bzip2'ed tar-file"),
    })

if _LZMA_SUPPORTED:
    _UNPACK_FORMATS.update({
        'xztar': (['.tar.xz', '.txz'], _unpack_tarfile, [],
                  "xz'ed tar-file"),
    })
1198
1199def _find_unpack_format(filename):
1200    for name, info in _UNPACK_FORMATS.items():
1201        for extension in info[0]:
1202            if filename.endswith(extension):
1203                return name
1204    return None
1205
def unpack_archive(filename, extract_dir=None, format=None):
    """Unpack an archive.

    `filename` is the name of the archive.

    `extract_dir` is the name of the target directory, where the archive
    is unpacked. If not provided, the current working directory is used.

    `format` is the archive format: one of "zip", "tar", "gztar", "bztar",
    or "xztar".  Or any other registered format.  If not provided,
    unpack_archive will use the filename extension and see if an unpacker
    was registered for that extension.

    A ValueError is raised when an explicitly given `format` is not
    registered; a ReadError is raised when no `format` is given and no
    unpacker is registered for the extension of `filename`.
    """
    sys.audit("shutil.unpack_archive", filename, extract_dir, format)

    if extract_dir is None:
        extract_dir = os.getcwd()

    extract_dir = os.fspath(extract_dir)
    filename = os.fspath(filename)

    if format is None:
        # we need to look at the registered unpackers supported extensions
        format = _find_unpack_format(filename)
        if format is None:
            raise ReadError("Unknown archive format '{0}'".format(filename))
        format_info = _UNPACK_FORMATS[format]
    else:
        try:
            format_info = _UNPACK_FORMATS[format]
        except KeyError:
            raise ValueError("Unknown unpack format '{0}'".format(format)) from None

    unpacker = format_info[1]
    unpacker(filename, extract_dir, **dict(format_info[2]))
1246
1247
# disk_usage() is only defined, and only exported through __all__, on
# platforms where one of the two implementations below is available.
if hasattr(os, 'statvfs'):

    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')
    _ntuple_diskusage.total.__doc__ = 'Total space in bytes'
    _ntuple_diskusage.used.__doc__ = 'Used space in bytes'
    _ntuple_diskusage.free.__doc__ = 'Free space in bytes'

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        The result is a named tuple with attributes 'total', 'used' and
        'free', each an amount of space in bytes, computed from
        os.statvfs(path).
        """
        vfs = os.statvfs(path)
        unit = vfs.f_frsize
        return _ntuple_diskusage(
            total=vfs.f_blocks * unit,
            # 'used' is derived from f_bfree while 'free' uses f_bavail.
            used=(vfs.f_blocks - vfs.f_bfree) * unit,
            free=vfs.f_bavail * unit,
        )

elif _WINDOWS:

    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        The result is a named tuple with attributes 'total', 'used' and
        'free', each an amount of space in bytes.
        """
        total, free = nt._getdiskusage(path)
        return _ntuple_diskusage(total, total - free, free)
1282
1283
def chown(path, user=None, group=None):
    """Change owner user and group of the given path.

    `user` may be a user name (a string) or a uid; `group` may be a gid (an
    int) or a group name.  Names are converted to their respective uid/gid.
    An argument left as None leaves that part of the ownership unchanged.

    Raises ValueError if both `user` and `group` are None, and LookupError
    if a name cannot be resolved.
    """
    sys.audit('shutil.chown', path, user, group)

    if user is None and group is None:
        raise ValueError("user and/or group must be set")

    # -1 means don't change it
    if user is None:
        uid = -1
    elif isinstance(user, str):
        # a string is taken to be the system username
        uid = _get_uid(user)
        if uid is None:
            raise LookupError("no such user: {!r}".format(user))
    else:
        uid = user

    if group is None:
        gid = -1
    elif isinstance(group, int):
        gid = group
    else:
        gid = _get_gid(group)
        if gid is None:
            raise LookupError("no such group: {!r}".format(group))

    os.chown(path, uid, gid)
1315
def get_terminal_size(fallback=(80, 24)):
    """Get the size of the terminal window.

    For each of the two dimensions, the environment variable, COLUMNS
    and LINES respectively, is checked. If the variable is defined and
    the value is a positive integer, it is used.

    Otherwise the terminal connected to sys.__stdout__ is queried by
    invoking os.get_terminal_size.

    If that query fails, either because the system doesn't support
    querying, or because we are not connected to a terminal, the value
    given in the fallback parameter is used instead. Fallback defaults to
    (80, 24).

    The value returned is a named tuple of type os.terminal_size.
    """
    def _from_environment(variable):
        # A missing or non-integer value counts as "not set" (0).
        try:
            return int(os.environ[variable])
        except (KeyError, ValueError):
            return 0

    columns = _from_environment('COLUMNS')
    lines = _from_environment('LINES')

    # only query if necessary
    if columns <= 0 or lines <= 0:
        try:
            size = os.get_terminal_size(sys.__stdout__.fileno())
        except (AttributeError, ValueError, OSError):
            # stdout is None, closed, detached, or not a terminal, or
            # os.get_terminal_size() is unsupported
            size = os.terminal_size(fallback)
        columns = columns if columns > 0 else size.columns
        lines = lines if lines > 0 else size.lines

    return os.terminal_size((columns, lines))
1360
1361
1362# Check that a given file can be accessed with the correct mode.
1363# Additionally check that `file` is not a directory, as on Windows
1364# directories pass the os.access check.
1365def _access_check(fn, mode):
1366    return (os.path.exists(fn) and os.access(fn, mode)
1367            and not os.path.isdir(fn))
1368
1369
def which(cmd, mode=os.F_OK | os.X_OK, path=None):
    """Given a command, mode, and a PATH string, return the path which
    conforms to the given mode on the PATH, or None if there is no such
    file.

    `mode` defaults to os.F_OK | os.X_OK. `path` defaults to the result
    of os.environ.get("PATH"), or can be overridden with a custom search
    path.

    A `cmd` that has a directory part is checked directly and the search
    path is not consulted.  The result has the same type (str or bytes)
    as `cmd`.
    """
    # If we're given a path with a directory part, look it up directly rather
    # than referring to PATH directories. This includes checking relative to the
    # current directory, e.g. ./script
    if os.path.dirname(cmd):
        return cmd if _access_check(cmd, mode) else None

    use_bytes = isinstance(cmd, bytes)

    if path is None:
        path = os.environ.get("PATH", None)
        # bpo-35755: Don't use os.defpath if the PATH environment variable is
        # set to an empty string
        if path is None:
            try:
                path = os.confstr("CS_PATH")
            except (AttributeError, ValueError):
                # os.confstr() or CS_PATH is not available
                path = os.defpath

    # PATH='' doesn't match, whereas PATH=':' looks in the current directory
    if not path:
        return None

    # Split the search path into directories of the same type as cmd.
    if use_bytes:
        search_dirs = os.fsencode(path).split(os.fsencode(os.pathsep))
    else:
        search_dirs = os.fsdecode(path).split(os.pathsep)

    if sys.platform == "win32":
        # The current directory takes precedence on Windows.
        curdir = os.fsencode(os.curdir) if use_bytes else os.curdir
        if curdir not in search_dirs:
            search_dirs.insert(0, curdir)

        # PATHEXT is necessary to check on Windows.
        pathext_source = os.getenv("PATHEXT") or _WIN_DEFAULT_PATHEXT
        pathext = [ext for ext in pathext_source.split(os.pathsep) if ext]
        if use_bytes:
            pathext = [os.fsencode(ext) for ext in pathext]

        # If cmd already ends with one of the executable extensions (as in
        # "python.exe") only that name is tried; otherwise every extension
        # is appended in turn.
        if any(cmd.lower().endswith(ext.lower()) for ext in pathext):
            candidates = [cmd]
        else:
            candidates = [cmd + ext for ext in pathext]
    else:
        # On other platforms you don't have things like PATHEXT to tell you
        # what file suffixes are executable, so just pass on cmd as-is.
        candidates = [cmd]

    visited = set()
    for directory in search_dirs:
        # Each directory is searched once, however often it is listed.
        key = os.path.normcase(directory)
        if key in visited:
            continue
        visited.add(key)
        for candidate in candidates:
            full_name = os.path.join(directory, candidate)
            if _access_check(full_name, mode):
                return full_name
    return None
1449