2000-02-04 15:10:34 +00:00
|
|
|
"""Common operations on Posix pathnames.
|
|
|
|
|
|
|
|
Instead of importing this module directly, import os and refer to
|
|
|
|
this module as os.path. The "os.path" name is an alias for this
|
|
|
|
module on Posix systems; on other systems (e.g. Mac, Windows),
|
|
|
|
os.path provides the same operations in a manner specific to that
|
|
|
|
platform, and is an alias to another module (e.g. macpath, ntpath).
|
|
|
|
|
|
|
|
Some of this can actually be useful on non-Posix systems too, e.g.
|
|
|
|
for manipulation of the pathname component of URLs.
|
1997-12-05 19:04:51 +00:00
|
|
|
"""
|
1996-07-23 03:47:28 +00:00
|
|
|
|
|
|
|
import os
|
1990-10-21 16:17:34 +00:00
|
|
|
import stat
|
1990-10-13 19:23:40 +00:00
|
|
|
|
2001-02-12 02:00:42 +00:00
|
|
|
# Public API of this module: the names exported by a star-import.
# "realpath" is defined further down in this file and is part of that API.
__all__ = ["normcase", "isabs", "join", "splitdrive", "split", "splitext",
           "basename", "dirname", "commonprefix", "getsize", "getmtime",
           "getatime", "islink", "exists", "isdir", "isfile", "ismount",
           "walk", "expanduser", "expandvars", "normpath", "abspath",
           "samefile", "sameopenfile", "samestat", "realpath"]
|
1990-10-13 19:23:40 +00:00
|
|
|
|
1992-01-14 18:29:32 +00:00
|
|
|
# Normalize the case of a pathname. Trivial in Posix, string.lower on Mac.
|
|
|
|
# On MS-DOS this may also turn slashes into backslashes; however, other
|
|
|
|
# normalizations (such as optimizing '../' away) are not allowed
|
|
|
|
# (another function should be defined to do that).
|
|
|
|
|
|
|
|
def normcase(s):
    """Return the pathname s exactly as given.

    Case normalization is a no-op under Posix; the function exists so
    that callers can use the same interface on every platform.
    """
    return s
|
1992-01-14 18:29:32 +00:00
|
|
|
|
|
|
|
|
2000-06-28 14:48:01 +00:00
|
|
|
# Return whether a path is absolute.
|
1992-01-14 18:29:32 +00:00
|
|
|
# Trivial in Posix, harder on the Mac or MS-DOS.
|
|
|
|
|
|
|
|
def isabs(s):
    """Return true if the pathname s is absolute, i.e. begins with '/'.

    The empty string is not absolute.
    """
    # Slicing (rather than indexing) keeps the empty string safe.
    first = s[:1]
    return first == '/'
|
1992-01-14 18:29:32 +00:00
|
|
|
|
|
|
|
|
1997-02-18 21:53:25 +00:00
|
|
|
# Join pathnames.
|
|
|
|
# Ignore the previous parts if a part is absolute.
|
1991-08-16 13:27:58 +00:00
|
|
|
# Insert a '/' unless the first part is empty or already ends in '/'.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1997-02-18 21:53:25 +00:00
|
|
|
def join(a, *p):
    """Join pathname components, inserting '/' between them where needed.

    A component that begins with '/' is absolute: it discards everything
    accumulated so far.  No separator is inserted after an empty
    accumulated path or after one that already ends in '/'.
    """
    result = a
    for part in p:
        if part[:1] == '/':
            # Absolute component: start over from here.
            result = part
            continue
        if result != '' and result[-1:] != '/':
            result = result + '/'
        result = result + part
    return result
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1992-03-31 18:54:35 +00:00
|
|
|
# Split a path in head (everything up to the last '/') and tail (the
|
1995-09-01 20:32:21 +00:00
|
|
|
# rest). If the path ends in '/', tail will be empty. If there is no
|
|
|
|
# '/' in the path, head will be empty.
|
|
|
|
# Trailing '/'es are stripped from head unless it is the root.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def split(p):
    """Split the pathname p at its last '/' and return (head, tail).

    tail is everything after the final slash (empty if p ends in '/');
    head is everything before it (empty if p contains no '/').
    Trailing slashes are removed from head unless head consists only of
    slashes, so the root is preserved.
    """
    cut = p.rfind('/') + 1
    head = p[:cut]
    tail = p[cut:]
    # An empty result means head was empty or all slashes: keep it as is.
    trimmed = head.rstrip('/')
    if trimmed:
        head = trimmed
    return head, tail
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1991-08-16 13:27:58 +00:00
|
|
|
# Split a path in root and extension.
|
1996-08-20 20:24:17 +00:00
|
|
|
# The extension is everything starting at the last dot in the last
|
1991-08-16 13:27:58 +00:00
|
|
|
# pathname component; the root is everything before that.
|
1992-01-14 18:29:32 +00:00
|
|
|
# It is always true that root + ext == p.
|
|
|
|
|
1991-08-16 13:27:58 +00:00
|
|
|
def splitext(p):
    """Split the extension from the pathname p and return (root, ext).

    ext starts at the last dot of the last pathname component and runs
    to the end of p; it is empty when that component contains no dot.
    root is everything before ext, so root + ext == p always holds.
    A dot that begins the last component counts as the start of an
    extension (for example '.profile' gives ('', '.profile')).
    """
    dot = p.rfind('.')
    # A dot located before the last '/' belongs to a directory name,
    # not to the final component.  This also covers "no dot at all",
    # since rfind() then returns -1.
    if dot <= p.rfind('/'):
        return p, ''
    return p[:dot], p[dot:]
|
1991-08-16 13:27:58 +00:00
|
|
|
|
|
|
|
|
1995-08-07 20:17:55 +00:00
|
|
|
# Split a pathname into a drive specification and the rest of the
|
|
|
|
# path. Useful on DOS/Windows/NT; on Unix, the drive is always empty.
|
|
|
|
|
|
|
|
def splitdrive(p):
    """Split the pathname p into (drive, path).

    Posix pathnames have no drive specification, so drive is always the
    empty string and path is p itself.
    """
    drive = ''
    return drive, p
|
1995-08-07 20:17:55 +00:00
|
|
|
|
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
# Return the tail (basename) part of a path.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def basename(p):
    """Return the final component of the pathname p.

    This is the second element of split(p); it is empty when p ends
    in '/'.
    """
    head, tail = split(p)
    return tail
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1992-11-05 10:43:02 +00:00
|
|
|
# Return the head (dirname) part of a path.
|
|
|
|
|
|
|
|
def dirname(p):
    """Return the directory part of the pathname p.

    This is the first element of split(p); it is empty when p contains
    no '/'.
    """
    head, tail = split(p)
    return head
|
1992-11-05 10:43:02 +00:00
|
|
|
|
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
# Return the longest prefix of all list elements.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def commonprefix(m):
    """Return the longest string that is a prefix of every item in m.

    The comparison is made position by position on the raw items, not
    per pathname component, so the result may end in the middle of a
    component.  Returns '' when m is empty or the items share nothing.
    """
    if not m:
        return ''
    prefix = m[0]
    for item in m:
        limit = len(prefix)
        matched = 0
        # Advance while the leading slices of both still agree.
        while matched < limit and prefix[:matched+1] == item[:matched+1]:
            matched = matched + 1
        if matched < limit:
            if matched == 0:
                return ''
            prefix = prefix[:matched]
    return prefix
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1998-07-24 20:49:26 +00:00
|
|
|
# Get size, mtime, atime of files.
|
|
|
|
|
|
|
|
def getsize(filename):
    """Return the ST_SIZE field of os.stat(filename).

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_SIZE]
|
|
|
|
|
|
|
|
def getmtime(filename):
    """Return the ST_MTIME field (last modification time) of os.stat(filename).

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_MTIME]
|
|
|
|
|
|
|
|
def getatime(filename):
    """Return the ST_ATIME field (last access time) of os.stat(filename).

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_ATIME]
|
1998-07-24 20:49:26 +00:00
|
|
|
|
|
|
|
|
1992-01-14 18:29:32 +00:00
|
|
|
# Is a path a symbolic link?
|
1996-07-23 03:47:28 +00:00
|
|
|
# This will always return false on systems where os.lstat doesn't exist.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
|
|
|
def islink(path):
    """Return true if path refers to a symbolic link.

    Returns 0 when os.lstat() fails on path, and also when os.lstat is
    not available at all (the AttributeError case).
    """
    try:
        mode = os.lstat(path)[stat.ST_MODE]
    except (os.error, AttributeError):
        return 0
    return stat.S_ISLNK(mode)
|
1992-01-14 18:29:32 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Does a path exist?
|
|
|
|
# This is false for dangling symbolic links.
|
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def exists(path):
    """Return 1 if os.stat(path) succeeds, 0 if it raises os.error.

    Because os.stat() follows symbolic links, a dangling link is
    reported as not existing.
    """
    try:
        os.stat(path)
    except os.error:
        return 0
    else:
        return 1
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1996-07-23 03:47:28 +00:00
|
|
|
# Is a path a directory?
|
1992-01-14 18:29:32 +00:00
|
|
|
# This follows symbolic links, so both islink() and isdir() can be true
|
|
|
|
# for the same path.
|
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def isdir(path):
    """Return true if path refers to a directory.

    os.stat() is used, so symbolic links are followed: a link to a
    directory is reported as a directory.  Returns 0 when os.stat()
    fails.
    """
    try:
        mode = os.stat(path)[stat.ST_MODE]
    except os.error:
        return 0
    return stat.S_ISDIR(mode)
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1992-03-31 18:54:35 +00:00
|
|
|
# Is a path a regular file?
|
1994-08-01 11:34:53 +00:00
|
|
|
# This follows symbolic links, so both islink() and isfile() can be true
|
1992-01-14 18:29:32 +00:00
|
|
|
# for the same path.
|
|
|
|
|
|
|
|
def isfile(path):
    """Return true if path refers to a regular file.

    os.stat() is used, so symbolic links are followed: a link to a
    regular file is reported as a regular file.  Returns 0 when
    os.stat() fails.
    """
    try:
        mode = os.stat(path)[stat.ST_MODE]
    except os.error:
        return 0
    return stat.S_ISREG(mode)
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
1991-11-12 15:37:40 +00:00
|
|
|
# Are two filenames really pointing to the same file?
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1991-11-12 15:37:40 +00:00
|
|
|
def samefile(f1, f2):
    """Return true if the pathnames f1 and f2 refer to the same file.

    Both names are passed to os.stat() and the results are compared
    with samestat().  An error from os.stat() propagates to the caller.
    """
    return samestat(os.stat(f1), os.stat(f2))
|
1991-11-12 15:37:40 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Are two open files really referencing the same file?
|
|
|
|
# (Not necessarily the same file descriptor!)
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1991-11-12 15:37:40 +00:00
|
|
|
def sameopenfile(fp1, fp2):
    """Return true if the open files fp1 and fp2 refer to the same file.

    fp1 and fp2 are handed directly to os.fstat(), and the two results
    are compared with samestat().
    """
    return samestat(os.fstat(fp1), os.fstat(fp2))
|
1991-11-12 15:37:40 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Are two stat buffers (obtained from stat, fstat or lstat)
|
|
|
|
# describing the same file?
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1991-11-12 15:37:40 +00:00
|
|
|
def samestat(s1, s2):
    """Return true if the stat buffers s1 and s2 describe the same file.

    Two buffers match when both their ST_INO and their ST_DEV fields
    are equal.  The device fields are only looked at when the i-node
    numbers already agree.
    """
    same_inode = s1[stat.ST_INO] == s2[stat.ST_INO]
    if not same_inode:
        return same_inode
    return s1[stat.ST_DEV] == s2[stat.ST_DEV]
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Is a path a mount point?
|
1996-07-23 03:47:28 +00:00
|
|
|
# (Does this work for all UNIXes? Is it even guaranteed to work by Posix?)
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def ismount(path):
    """Return 1 if path is a mount point, 0 otherwise.

    A path is taken to be a mount point when its parent directory
    (path/..) is on a different device, or when path and path/.. are the
    same i-node (as is the case for the root directory).  A path that
    cannot be stat'ed is not a mount point.

    A symbolic link is never reported as a mount point, even when it
    points at one: os.stat() follows the link, so without this check
    the link would be indistinguishable from its target.
    """
    if islink(path):
        return 0
    try:
        s1 = os.stat(path)
        s2 = os.stat(join(path, '..'))
    except os.error:
        return 0 # It doesn't exist -- so not a mount point :-)
    if s1[stat.ST_DEV] != s2[stat.ST_DEV]:
        return 1 # path/.. is on a different device than path
    if s1[stat.ST_INO] == s2[stat.ST_INO]:
        return 1 # path/.. is the same i-node as path
    return 0
|
1990-10-13 19:23:40 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Directory tree walk.
|
1992-01-14 18:29:32 +00:00
|
|
|
# For each directory under top (including top itself, but excluding
|
|
|
|
# '.' and '..'), func(arg, dirname, filenames) is called, where
|
|
|
|
# dirname is the name of the directory and filenames is the list
|
1997-12-05 19:04:51 +00:00
|
|
|
# of files (and subdirectories etc.) in the directory.
|
1992-01-14 18:29:32 +00:00
|
|
|
# The func may modify the filenames list, to implement a filter,
|
1990-10-13 19:23:40 +00:00
|
|
|
# or to impose a different order of visiting.
|
1992-01-14 18:29:32 +00:00
|
|
|
|
1990-10-13 19:23:40 +00:00
|
|
|
def walk(top, func, arg):
    """Call func(arg, dirname, names) for every directory under top.

    The tree rooted at top is visited top-down, starting with top
    itself.  names is the os.listdir() result for dirname; func may
    modify that list in place to filter or reorder what is visited
    next, because the same list is then used to find subdirectories.
    Directories that cannot be listed and entries that cannot be
    lstat'ed are skipped silently.  Subdirectories are recognized with
    os.lstat(), so symbolic links to directories are not descended into.
    """
    try:
        entries = os.listdir(top)
    except os.error:
        return
    func(arg, top, entries)
    for entry in entries:
        child = join(top, entry)
        try:
            mode = os.lstat(child)[stat.ST_MODE]
        except os.error:
            continue
        if stat.S_ISDIR(mode):
            walk(child, func, arg)
|
1992-01-14 18:29:32 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Expand paths beginning with '~' or '~user'.
|
|
|
|
# '~' means $HOME; '~user' means that user's home directory.
|
|
|
|
# If the path doesn't begin with '~', or if the user or $HOME is unknown,
|
|
|
|
# the path is returned unchanged (leaving error reporting to whatever
|
|
|
|
# function is called with the expanded path as argument).
|
|
|
|
# See also module 'glob' for expansion of *, ? and [...] in pathnames.
|
|
|
|
# (A function should also be defined to do full *sh-style environment
|
|
|
|
# variable expansion.)
|
|
|
|
|
|
|
|
def expanduser(path):
    """Expand a leading '~' or '~user' in path to a home directory.

    '~' alone is replaced by the value of the HOME environment
    variable; '~user' is replaced by that user's home directory as
    found through pwd.getpwnam().  The path is returned unchanged when
    it does not start with '~', when HOME is not set, or when the user
    is unknown.
    """
    if path[:1] != '~':
        return path
    # i is the index just past the '~' or '~user' prefix.
    i = path.find('/', 1)
    if i < 0:
        i = len(path)
    if i == 1:
        try:
            userhome = os.environ['HOME']
        except KeyError:
            return path
    else:
        import pwd
        try:
            pwent = pwd.getpwnam(path[1:i])
        except KeyError:
            return path
        userhome = pwent[5]     # field 5 of a passwd entry is the home dir
    # Avoid a doubled slash when the home directory already ends in one.
    if userhome[-1:] == '/':
        i = i + 1
    return userhome + path[i:]
|
1992-08-09 13:54:50 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Expand paths containing shell variable substitutions.
|
1994-08-01 11:34:53 +00:00
|
|
|
# This expands the forms $variable and ${variable} only.
|
2000-06-28 14:48:01 +00:00
|
|
|
# Non-existent variables are left unchanged.
|
1994-08-01 11:34:53 +00:00
|
|
|
|
|
|
|
# Compiled pattern used by expandvars(); built on first use.
_varprog = None


def expandvars(path):
    """Expand shell variables of the forms $var and ${var} in path.

    Values are taken from os.environ.  References to variables that are
    not set are left in the result unchanged.  A substituted value is
    not scanned again, so a '$' inside a value is never expanded.
    """
    global _varprog
    if '$' not in path:
        return path
    if not _varprog:
        import re
        _varprog = re.compile(r'\$(\w+|\{[^}]*\})')
    i = 0
    while 1:
        m = _varprog.search(path, i)
        if not m:
            break
        i, j = m.span(0)
        name = m.group(1)
        if name[:1] == '{' and name[-1:] == '}':
            name = name[1:-1]
        if name in os.environ:
            tail = path[j:]
            path = path[:i] + os.environ[name]
            # Resume the search after the inserted value.
            i = len(path)
            path = path + tail
        else:
            i = j
    return path
|
1992-11-05 10:43:02 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A/B.
|
|
|
|
# It should be understood that this may change the meaning of the path
|
|
|
|
# if it contains symbolic links!
|
|
|
|
|
|
|
|
def normpath(path):
    """Normalize path by collapsing redundant separators and dot components.

    Empty components and '.' are dropped, and 'name/..' pairs cancel
    out.  Leading '..' components of a relative path are kept; '..' at
    the root of an absolute path is dropped.  Exactly two leading
    slashes are preserved, while three or more collapse to one.  The
    empty path, and any path that normalizes to nothing, gives '.'.

    Note that removing 'name/..' can change the meaning of a path when
    name is a symbolic link.
    """
    if path == '':
        return '.'
    # POSIX allows one or two initial slashes, but treats three or more
    # as a single slash.
    if not path.startswith('/'):
        lead = 0
    elif path.startswith('//') and not path.startswith('///'):
        lead = 2
    else:
        lead = 1
    kept = []
    for comp in path.split('/'):
        if comp == '' or comp == '.':
            continue
        if comp != '..':
            kept.append(comp)
        elif kept:
            if kept[-1] == '..':
                kept.append(comp)
            else:
                kept.pop()
        elif not lead:
            # Relative path climbing above its starting point.
            kept.append(comp)
    result = '/'.join(kept)
    if lead:
        result = '/' * lead + result
    return result or '.'
|
1999-01-29 18:05:18 +00:00
|
|
|
|
|
|
|
|
|
|
|
def abspath(path):
    """Return a normalized, absolute version of path.

    A relative path is first joined onto os.getcwd(); the result is
    then passed through normpath().
    """
    if isabs(path):
        return normpath(path)
    return normpath(join(os.getcwd(), path))
|
2001-09-17 15:16:09 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Return a canonical path (i.e. the absolute location of a file on the
|
|
|
|
# filesystem).
|
|
|
|
|
|
|
|
def realpath(filename):
    """Return the canonical path of filename, with symbolic links resolved.

    filename is first made absolute and normalized with abspath().  The
    path is then scanned from the root; the first component found to be
    a symbolic link is replaced by its target and the scan starts over,
    until no link remains.

    If resolution arrives at a path it has already visited (a cycle
    such as a -> b -> a), that path is returned as is instead of
    recursing without bound.
    """
    return _realpath(abspath(filename), {})


def _realpath(filename, seen):
    """Resolve links in the absolute, normalized filename; seen holds
    the paths already visited during this resolution."""
    if filename in seen:
        # Same path reached twice: the links form a cycle.
        return filename
    seen[filename] = 1

    bits = ['/'] + filename.split('/')[1:]
    for i in range(2, len(bits) + 1):
        component = join(*bits[0:i])
        if islink(component):
            target = os.readlink(component)
            # A relative target is interpreted relative to the
            # directory that contains the link.
            parent = split(component)[0]
            resolved = normpath(join(parent, target))
            newpath = join(*([resolved] + bits[i:]))
            return _realpath(abspath(newpath), seen)

    return filename
|