mirror of
https://github.com/python/cpython.git
synced 2025-01-08 17:44:35 +08:00
faf2f63faf
svn+ssh://pythondev@svn.python.org/python/trunk ........ r59704 | christian.heimes | 2008-01-04 04:15:05 +0100 (Fri, 04 Jan 2008) | 1 line Moved include "Python.h" in front of other imports to silence a warning. ........ r59706 | raymond.hettinger | 2008-01-04 04:22:53 +0100 (Fri, 04 Jan 2008) | 10 lines Minor fix-ups to named tuples: * Make the _replace() method respect subclassing. * Using property() to make _fields read-only wasn't a good idea. It caused len(Point._fields) to fail. * Add note to _cast() about length checking and alternative with the star-operator. ........ r59707 | jeffrey.yasskin | 2008-01-04 09:01:23 +0100 (Fri, 04 Jan 2008) | 3 lines Make math.{floor,ceil}({int,long}) return float again for backwards compatibility after r59671 made them return integral types. ........ r59709 | christian.heimes | 2008-01-04 14:21:07 +0100 (Fri, 04 Jan 2008) | 1 line Bug #1713: posixpath.ismount() claims symlink to a mountpoint is a mountpoint. ........ r59712 | lars.gustaebel | 2008-01-04 15:00:33 +0100 (Fri, 04 Jan 2008) | 5 lines Issue #1735: TarFile.extractall() now correctly sets directory permissions and times. (will backport to 2.5) ........ r59714 | andrew.kuchling | 2008-01-04 15:47:17 +0100 (Fri, 04 Jan 2008) | 1 line Update links to bug/patch tracker ........ r59716 | christian.heimes | 2008-01-04 16:23:30 +0100 (Fri, 04 Jan 2008) | 1 line Added interface to Windows' WSAIoctl and a simple example for a network sniffer. ........ r59717 | christian.heimes | 2008-01-04 16:29:00 +0100 (Fri, 04 Jan 2008) | 1 line And here is the rest of Hirokazu Yamamoto's patch for VS6.0 support. Thanks Hiro! ........ r59719 | christian.heimes | 2008-01-04 16:34:06 +0100 (Fri, 04 Jan 2008) | 1 line Reverted last transaction. It's the wrong branch. ........ r59721 | christian.heimes | 2008-01-04 16:48:06 +0100 (Fri, 04 Jan 2008) | 1 line socket.ioctl is only available on Windows ........ 
r59722 | andrew.kuchling | 2008-01-04 19:24:41 +0100 (Fri, 04 Jan 2008) | 1 line Fix markup ........ r59723 | andrew.kuchling | 2008-01-04 19:25:05 +0100 (Fri, 04 Jan 2008) | 1 line Fix markup ........ r59725 | guido.van.rossum | 2008-01-05 01:59:59 +0100 (Sat, 05 Jan 2008) | 3 lines Patch #1725 by Mark Dickinson, fixes incorrect conversion of -1e1000 and adds errors for -0x. ........ r59726 | guido.van.rossum | 2008-01-05 02:21:57 +0100 (Sat, 05 Jan 2008) | 2 lines Patch #1698 by Senthil: allow '@' in username when parsed by urlparse.py. ........ r59727 | raymond.hettinger | 2008-01-05 02:35:43 +0100 (Sat, 05 Jan 2008) | 1 line Improve namedtuple's _cast() method with a docstring, new name, and error-checking. ........ r59728 | raymond.hettinger | 2008-01-05 03:17:24 +0100 (Sat, 05 Jan 2008) | 1 line Add error-checking to namedtuple's _replace() method. ........ r59730 | fred.drake | 2008-01-05 05:38:38 +0100 (Sat, 05 Jan 2008) | 2 lines clean up a comment ........ r59731 | jeffrey.yasskin | 2008-01-05 09:47:13 +0100 (Sat, 05 Jan 2008) | 11 lines Continue rolling back pep-3141 changes that changed behavior from 2.5. This round included: * Revert round to its 2.6 behavior (half away from 0). * Because round, floor, and ceil always return float again, it's no longer necessary to have them delegate to __xxx___, so I've ripped that out of their implementations and the Real ABC. This also helps in implementing types that work in both 2.6 and 3.0: you return int from the __xxx__ methods, and let it get enabled by the version upgrade. * Make pow(-1, .5) raise a ValueError again. ........ r59736 | andrew.kuchling | 2008-01-05 16:13:49 +0100 (Sat, 05 Jan 2008) | 1 line Fix comment typo ........ r59738 | thomas.heller | 2008-01-05 18:15:44 +0100 (Sat, 05 Jan 2008) | 1 line Add myself. ........ r59739 | georg.brandl | 2008-01-05 18:49:17 +0100 (Sat, 05 Jan 2008) | 2 lines Fix C++-style comment. ........ 
r59742 | georg.brandl | 2008-01-05 20:28:16 +0100 (Sat, 05 Jan 2008) | 2 lines Remove with_statement future imports from 2.6 docs. ........ r59743 | georg.brandl | 2008-01-05 20:29:45 +0100 (Sat, 05 Jan 2008) | 2 lines Simplify index entries; fix #1712. ........ r59744 | georg.brandl | 2008-01-05 20:44:22 +0100 (Sat, 05 Jan 2008) | 2 lines Doc patch #1730 from Robin Stocker; minor corrections mostly to os.rst. ........ r59749 | georg.brandl | 2008-01-05 21:29:13 +0100 (Sat, 05 Jan 2008) | 2 lines Revert socket.rst to unix-eol. ........ r59750 | georg.brandl | 2008-01-05 21:33:46 +0100 (Sat, 05 Jan 2008) | 2 lines Set native svn:eol-style property for text files. ........ r59752 | georg.brandl | 2008-01-05 21:46:29 +0100 (Sat, 05 Jan 2008) | 2 lines #1719: capitalization error in "UuidCreate". ........ r59753 | georg.brandl | 2008-01-05 22:02:25 +0100 (Sat, 05 Jan 2008) | 2 lines Repair markup. ........ r59754 | georg.brandl | 2008-01-05 22:10:50 +0100 (Sat, 05 Jan 2008) | 2 lines Use markup. ........ r59757 | christian.heimes | 2008-01-05 22:35:52 +0100 (Sat, 05 Jan 2008) | 1 line Final adjustments for #1601 ........ r59758 | guido.van.rossum | 2008-01-05 23:19:06 +0100 (Sat, 05 Jan 2008) | 3 lines Patch #1637: fix urlparse for URLs like 'http://x.com?arg=/foo'. Fix by John Nagle. ........ r59759 | guido.van.rossum | 2008-01-05 23:20:01 +0100 (Sat, 05 Jan 2008) | 2 lines Add John Nagle (of issue #1637). ........ r59765 | raymond.hettinger | 2008-01-06 10:02:24 +0100 (Sun, 06 Jan 2008) | 1 line Small code simplification. Forgot that classmethods can be called from intances. ........ r59766 | martin.v.loewis | 2008-01-06 11:09:48 +0100 (Sun, 06 Jan 2008) | 2 lines Use vcbuild for VS 2009. ........ r59767 | martin.v.loewis | 2008-01-06 12:03:43 +0100 (Sun, 06 Jan 2008) | 2 lines Package using VS 2008. ........ r59768 | martin.v.loewis | 2008-01-06 12:13:16 +0100 (Sun, 06 Jan 2008) | 2 lines Don't try to package msvcr90 for the moment. ........ 
r59769 | georg.brandl | 2008-01-06 15:17:36 +0100 (Sun, 06 Jan 2008) | 4 lines #1696393: don't check for '.' and '..' in ntpath.walk since they aren't returned from os.listdir anymore. Reported by Michael Haggerty. ........ r59770 | georg.brandl | 2008-01-06 15:27:15 +0100 (Sun, 06 Jan 2008) | 3 lines #1742: don't raise exception on os.path.relpath("a", "a"), but return os.curdir. Reported by Jesse Towner. ........ r59771 | georg.brandl | 2008-01-06 15:33:52 +0100 (Sun, 06 Jan 2008) | 2 lines #1591: Clarify docstring of Popen3. ........ r59772 | georg.brandl | 2008-01-06 16:30:34 +0100 (Sun, 06 Jan 2008) | 2 lines #1680: fix context manager example function name. ........ r59773 | georg.brandl | 2008-01-06 16:34:57 +0100 (Sun, 06 Jan 2008) | 2 lines #1755097: document default values for [].sort() and sorted(). ........
404 lines
12 KiB
Python
404 lines
12 KiB
Python
"""Common operations on Posix pathnames.
|
|
|
|
Instead of importing this module directly, import os and refer to
|
|
this module as os.path. The "os.path" name is an alias for this
|
|
module on Posix systems; on other systems (e.g. Mac, Windows),
|
|
os.path provides the same operations in a manner specific to that
|
|
platform, and is an alias to another module (e.g. macpath, ntpath).
|
|
|
|
Some of this can actually be useful on non-Posix systems too, e.g.
|
|
for manipulation of the pathname component of URLs.
|
|
"""
|
|
|
|
import os
|
|
import stat
|
|
import genericpath
|
|
from genericpath import *
|
|
|
|
# Public names exported by "from posixpath import *".
# NOTE(review): several entries (commonprefix, getsize, getmtime, getatime,
# getctime, exists, isdir, isfile) are not defined in this file; presumably
# they arrive through "from genericpath import *" -- confirm.
__all__ = ["normcase","isabs","join","splitdrive","split","splitext",
           "basename","dirname","commonprefix","getsize","getmtime",
           "getatime","getctime","islink","exists","lexists","isdir","isfile",
           "ismount","walk","expanduser","expandvars","normpath","abspath",
           "samefile","sameopenfile","samestat",
           "curdir","pardir","sep","pathsep","defpath","altsep","extsep",
           "devnull","realpath","supports_unicode_filenames","relpath"]
|
|
|
|
# strings representing various path-related bits and pieces
|
|
curdir = '.'        # current-directory component; default "start" of relpath()
pardir = '..'       # parent-directory component; used by relpath()
extsep = '.'        # extension separator handed to genericpath._splitext()
sep = '/'           # separator between pathname components
pathsep = ':'       # presumably separates the entries of a search path
defpath = ':/bin:/usr/bin'  # presumably the default executable search path
altsep = None       # no alternative separator; handed to _splitext()
devnull = '/dev/null'  # pathname of the null device
|
|
|
|
# Normalize the case of a pathname. Trivial in Posix, string.lower on Mac.
|
|
# On MS-DOS this may also turn slashes into backslashes; however, other
|
|
# normalizations (such as optimizing '../' away) are not allowed
|
|
# (another function should be defined to do that).
|
|
|
|
def normcase(s):
    """Normalize the case of a pathname.

    This has no effect under Posix: the argument is handed back as-is.
    """
    return s
|
|
|
|
|
|
# Return whether a path is absolute.
|
|
# Trivial in Posix, harder on the Mac or MS-DOS.
|
|
|
|
def isabs(s):
    """Return True if the pathname is absolute, i.e. begins with a slash."""
    is_absolute = s.startswith('/')
    return is_absolute
|
|
|
|
|
|
# Join pathnames.
|
|
# Ignore the previous parts if a part is absolute.
|
|
# Insert a '/' unless the first part is empty or already ends in '/'.
|
|
|
|
def join(a, *p):
    """Join pathname components, putting a '/' between them where needed.

    Whenever a component is absolute (starts with '/'), everything that
    was accumulated before it is thrown away and joining restarts from
    that component.  No separator is inserted after an empty accumulated
    path or after one that already ends in '/'.
    """
    result = a
    for part in p:
        if part.startswith('/'):
            # An absolute component replaces whatever came before it.
            result = part
            continue
        if not (result == '' or result.endswith('/')):
            result += '/'
        result += part
    return result
|
|
|
|
|
|
# Split a path in head (everything up to the last '/') and tail (the
|
|
# rest). If the path ends in '/', tail will be empty. If there is no
|
|
# '/' in the path, head will be empty.
|
|
# Trailing '/'es are stripped from head unless it is the root.
|
|
|
|
def split(p):
    """Split a pathname into the tuple (head, tail).

    tail is whatever follows the final slash and head is everything in
    front of it; either of the two may be empty.  Trailing slashes are
    removed from head unless head consists of slashes only (the root).
    """
    cut = p.rfind('/') + 1
    head = p[:cut]
    tail = p[cut:]
    # Only a head holding something besides slashes loses its trailing ones.
    if head.strip('/'):
        head = head.rstrip('/')
    return head, tail
|
|
|
|
|
|
# Split a path in root and extension.
|
|
# The extension is everything starting at the last dot in the last
|
|
# pathname component; the root is everything before that.
|
|
# It is always true that root + ext == p.
|
|
|
|
def splitext(p):
    # Thin wrapper: the shared implementation lives in genericpath and only
    # needs to be told which separators this module uses.
    root_and_ext = genericpath._splitext(p, sep, altsep, extsep)
    return root_and_ext

# Reuse the documentation of the shared implementation.
splitext.__doc__ = genericpath._splitext.__doc__
|
|
|
|
# Split a pathname into a drive specification and the rest of the
|
|
# path. Useful on DOS/Windows/NT; on Unix, the drive is always empty.
|
|
|
|
def splitdrive(p):
    """Split a pathname into the pair (drive, path).

    The drive part is always the empty string here, so the path part is
    simply the argument itself.
    """
    drive = ''
    return drive, p
|
|
|
|
|
|
# Return the tail (basename) part of a path, same as split(path)[1].
|
|
|
|
def basename(p):
    """Return the final component of a pathname.

    That is everything after the last slash; it is empty when the
    pathname ends in a slash.
    """
    return p[p.rfind('/') + 1:]
|
|
|
|
|
|
# Return the head (dirname) part of a path, same as split(path)[0].
|
|
|
|
def dirname(p):
    """Return the directory component of a pathname.

    That is everything up to the last slash, with trailing slashes
    removed unless the result consists of slashes only (the root).
    """
    head = p[:p.rfind('/') + 1]
    if not head.strip('/'):
        # Empty, or nothing but slashes: leave untouched.
        return head
    return head.rstrip('/')
|
|
|
|
|
|
# Is a path a symbolic link?
|
|
# This will always return false on systems where os.lstat doesn't exist.
|
|
|
|
def islink(path):
    """Return True if path is a symbolic link.

    False is returned when os.lstat() fails for the path, and also when
    calling it raises AttributeError (e.g. os.lstat is not available).
    """
    try:
        info = os.lstat(path)
    except (os.error, AttributeError):
        is_link = False
    else:
        is_link = stat.S_ISLNK(info.st_mode)
    return is_link
|
|
|
|
# Being true for dangling symbolic links is also useful.
|
|
|
|
def lexists(path):
    """Test whether a path exists.  Returns True for broken symbolic links.

    The check uses os.lstat(), which does not follow a final symbolic
    link, so a dangling link still counts as existing.  Any os.error
    raised by os.lstat() is reported as False.
    """
    try:
        # Only success or failure matters; the stat result is not needed.
        os.lstat(path)
    except os.error:
        return False
    return True
|
|
|
|
|
|
# Are two filenames really pointing to the same file?
|
|
|
|
def samefile(f1, f2):
    """Return True if both pathnames refer to the same actual file.

    Each pathname is examined with os.stat() (f1 first, then f2) and the
    two results are compared with samestat().  Errors raised by
    os.stat() are not caught here.
    """
    return samestat(os.stat(f1), os.stat(f2))
|
|
|
|
|
|
# Are two open files really referencing the same file?
|
|
# (Not necessarily the same file descriptor!)
|
|
|
|
def sameopenfile(fp1, fp2):
    """Return True if two open files refer to the same file.

    fp1 and fp2 are handed to os.fstat() (fp1 first), so they must be
    whatever os.fstat() accepts; the two results are then compared with
    samestat().
    """
    return samestat(os.fstat(fp1), os.fstat(fp2))
|
|
|
|
|
|
# Are two stat buffers (obtained from stat, fstat or lstat)
|
|
# describing the same file?
|
|
|
|
def samestat(s1, s2):
    """Return True if two stat buffers describe the same file.

    Two buffers match when both their st_ino and their st_dev fields
    are equal.
    """
    if s1.st_ino != s2.st_ino:
        return False
    return s1.st_dev == s2.st_dev
|
|
|
|
|
|
# Is a path a mount point?
|
|
# (Does this work for all UNIXes? Is it even guaranteed to work by Posix?)
|
|
|
|
def ismount(path):
    """Test whether a path is a mount point.

    A path counts as a mount point when path/.. lives on a different
    device than path, or when both are the same i-node on the same
    device.  False is returned when the path (or its parent) cannot be
    examined with os.lstat(), and for symbolic links.
    """
    try:
        s1 = os.lstat(path)
    except os.error:
        return False # It doesn't exist -- so not a mount point :-)
    if stat.S_ISLNK(s1.st_mode):
        # A symbolic link is never a mount point.  Without this check the
        # comparison below would pit the link itself against the parent of
        # the link's *target* (path/.. is resolved through the link), so a
        # link pointing onto another device would be reported as a mount.
        return False
    try:
        s2 = os.lstat(join(path, '..'))
    except os.error:
        return False
    if s1.st_dev != s2.st_dev:
        return True # path/.. on a different device as path
    # path/.. being the same i-node as path identifies the root of a tree.
    return s1.st_ino == s2.st_ino
|
|
|
|
|
|
# Directory tree walk.
|
|
# For each directory under top (including top itself, but excluding
|
|
# '.' and '..'), func(arg, dirname, filenames) is called, where
|
|
# dirname is the name of the directory and filenames is the list
|
|
# of files (and subdirectories etc.) in the directory.
|
|
# The func may modify the filenames list, to implement a filter,
|
|
# or to impose a different order of visiting.
|
|
|
|
def walk(top, func, arg):
    """Walk a directory tree, invoking a callback for every directory.

    For top itself and each directory found below it, the call
    func(arg, dirname, fnames) is made: dirname is the directory's name
    and fnames is the list returned by os.listdir() for it.  The list
    is iterated only after func returns, so func may edit it in place
    (e.g. via del or slice assignment) to prune the walk or to change
    the visiting order; only names still in the list are descended
    into.  arg is passed through to func untouched and has no meaning
    to walk itself; None is a common choice.

    Directories that cannot be listed and entries that cannot be
    lstat'ed are skipped silently.  Because os.lstat() is used,
    symbolic links to directories are not followed.
    """
    try:
        entries = os.listdir(top)
    except os.error:
        return
    func(arg, top, entries)
    for entry in entries:
        child = join(top, entry)
        try:
            info = os.lstat(child)
        except os.error:
            continue
        if not stat.S_ISDIR(info.st_mode):
            continue
        walk(child, func, arg)
|
|
|
|
|
|
# Expand paths beginning with '~' or '~user'.
|
|
# '~' means $HOME; '~user' means that user's home directory.
|
|
# If the path doesn't begin with '~', or if the user or $HOME is unknown,
|
|
# the path is returned unchanged (leaving error reporting to whatever
|
|
# function is called with the expanded path as argument).
|
|
# See also module 'glob' for expansion of *, ? and [...] in pathnames.
|
|
# (A function should also be defined to do full *sh-style environment
|
|
# variable expansion.)
|
|
|
|
def expanduser(path):
    """Expand ~ and ~user constructions.  If user or $HOME is unknown,
    do nothing.

    A leading '~' stands for $HOME or, when HOME is not set, for the
    home directory the password database records for the current uid.
    A leading '~user' stands for that user's home directory.  Paths not
    starting with '~' are returned unchanged, as are paths whose user
    cannot be looked up.
    """
    if not path.startswith('~'):
        return path
    # i marks the end of the '~' or '~user' prefix.
    i = path.find('/', 1)
    if i < 0:
        i = len(path)
    if i == 1:
        if 'HOME' in os.environ:
            userhome = os.environ['HOME']
        else:
            import pwd
            try:
                userhome = pwd.getpwuid(os.getuid()).pw_dir
            except KeyError:
                # The current uid has no password database entry: the
                # home directory is unknown, so leave the path alone.
                return path
    else:
        import pwd
        try:
            pwent = pwd.getpwnam(path[1:i])
        except KeyError:
            return path
        userhome = pwent.pw_dir
    # Avoid a doubled slash when the home directory ends in one ...
    userhome = userhome.rstrip('/')
    # ... but a home directory of '/' is emptied by the strip, so a bare
    # '~' must fall back to the root instead of the empty string.
    return (userhome + path[i:]) or '/'
|
|
|
|
|
|
# Expand paths containing shell variable substitutions.
|
|
# This expands the forms $variable and ${variable} only.
|
|
# Non-existent variables are left unchanged.
|
|
|
|
# Compiled pattern for $var / ${var}; built on first use by expandvars().
_varprog = None

def expandvars(path):
    """Expand shell variables of the forms $var and ${var}.

    Values are taken from os.environ.  References to variables that are
    not set are left in the result unchanged, and text inserted by a
    substitution is not scanned again for further references.
    """
    global _varprog
    if '$' not in path:
        return path
    if not _varprog:
        import re
        _varprog = re.compile(r'\$(\w+|\{[^}]*\})')
    pos = 0
    match = _varprog.search(path, pos)
    while match:
        start, end = match.span(0)
        name = match.group(1)
        if name.startswith('{') and name.endswith('}'):
            name = name[1:-1]
        if name in os.environ:
            expanded = path[:start] + os.environ[name]
            # Resume the search right after the inserted value.
            pos = len(expanded)
            path = expanded + path[end:]
        else:
            pos = end
        match = _varprog.search(path, pos)
    return path
|
|
|
|
|
|
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A/B.
|
|
# It should be understood that this may change the meaning of the path
|
|
# if it contains symbolic links!
|
|
|
|
def normpath(path):
    """Normalize a path: collapse repeated slashes and '.' components,
    and resolve '..' components textually.

    An empty path, or one that normalizes to nothing, becomes '.'.
    """
    if path == '':
        return '.'
    # POSIX allows one or two initial slashes, but treats three or more
    # as single slash.
    if not path.startswith('/'):
        lead = 0
    elif path.startswith('//') and not path.startswith('///'):
        lead = 2
    else:
        lead = 1
    kept = []
    for piece in path.split('/'):
        if piece == '' or piece == '.':
            continue
        if piece != '..':
            kept.append(piece)
        elif kept:
            if kept[-1] == '..':
                # Already climbing above the starting point: keep climbing.
                kept.append(piece)
            else:
                # '..' cancels the component in front of it.
                kept.pop()
        elif not lead:
            # A relative path may begin with '..'; at the root it is dropped.
            kept.append(piece)
    result = '/'.join(kept)
    if lead:
        result = '/' * lead + result
    return result or '.'
|
|
|
|
|
|
def abspath(path):
    """Return a normalized, absolute version of path.

    A relative path is first joined onto the current working directory;
    the result is then passed through normpath().
    """
    if isabs(path):
        return normpath(path)
    return normpath(join(os.getcwd(), path))
|
|
|
|
|
|
# Return a canonical path (i.e. the absolute location of a file on the
|
|
# filesystem).
|
|
|
|
def realpath(filename):
    """Return the canonical path of filename, with the symbolic links
    met along the way eliminated.

    The path is examined prefix by prefix.  At the first prefix that is
    a symbolic link, the link is resolved, the remaining components are
    appended and the whole procedure starts over on the new path.  If
    resolving runs into a loop of links, the absolute form of the path
    assembled so far is returned as it stands.
    """
    if isabs(filename):
        parts = ['/'] + filename.split('/')[1:]
    else:
        parts = [''] + filename.split('/')

    for end in range(2, len(parts) + 1):
        prefix = join(*parts[0:end])
        if not islink(prefix):
            continue
        # Resolve symbolic links.
        remainder = parts[end:]
        target = _resolve_link(prefix)
        if target is None:
            # Infinite loop -- return original component + rest of the path
            return abspath(join(*([prefix] + remainder)))
        return realpath(join(*([target] + remainder)))

    return abspath(filename)
|
|
|
|
|
|
def _resolve_link(path):
    """Internal helper: follow a chain of symbolic links.

    Links are followed until the path is no longer a symbolic link, in
    which case that path is returned, or until a path turns up a second
    time, which means the links form a loop; None is returned then.
    """
    visited = set()
    while islink(path):
        if path in visited:
            # Already seen this path, so we must have a symlink loop
            return None
        visited.add(path)
        # Resolve where the link points to
        target = os.readlink(path)
        if not isabs(target):
            # A relative target is relative to the link's own directory.
            target = join(dirname(path), target)
        path = normpath(target)
    return path
|
|
|
|
# Exported through __all__ and always False in this module.
# NOTE(review): presumably tells callers whether arbitrary Unicode strings
# may be used as file names -- confirm against the os.path documentation.
supports_unicode_filenames = False
|
|
|
|
def relpath(path, start=curdir):
    """Return a relative version of a path.

    The result leads from the directory start (default: the current
    directory) to path.  Both are made absolute with abspath() first;
    the file system is not consulted otherwise.  When both name the
    same location, curdir is returned.

    Raises ValueError if path is empty.
    """

    if not path:
        raise ValueError("no path specified")

    # Drop the empty strings that splitting produces for the leading
    # slash (and for the root itself, which splits into ['', '']).
    # Left in place they are counted as real components, so e.g.
    # relpath('/a', '/') came out as '../a' instead of 'a'.
    start_list = [x for x in abspath(start).split(sep) if x]
    path_list = [x for x in abspath(path).split(sep) if x]

    # Work out how much of the filepath is shared by start and path.
    i = len(commonprefix([start_list, path_list]))

    # Climb out of what is left of start, then descend into the rest of path.
    rel_list = [pardir] * (len(start_list)-i) + path_list[i:]
    if not rel_list:
        return curdir
    return join(*rel_list)
|