Issue #789290: make sure that hash(2**63) == hash(2.**63) on 64-bit
[python.git] / Lib / ntpath.py
blob714f2054161ed2b731be7a57f3cb502d56ee1d34
1 # Module 'ntpath' -- common operations on WinNT/Win95 pathnames
2 """Common pathname manipulations, WindowsNT/95 version.
4 Instead of importing this module directly, import os and refer to this
5 module as os.path.
6 """
8 import os
9 import sys
10 import stat
11 import genericpath
12 import warnings
14 from genericpath import *
16 __all__ = ["normcase","isabs","join","splitdrive","split","splitext",
17 "basename","dirname","commonprefix","getsize","getmtime",
18 "getatime","getctime", "islink","exists","lexists","isdir","isfile",
19 "ismount","walk","expanduser","expandvars","normpath","abspath",
20 "splitunc","curdir","pardir","sep","pathsep","defpath","altsep",
21 "extsep","devnull","realpath","supports_unicode_filenames","relpath"]
23 # strings representing various path-related bits and pieces
24 curdir = '.'
25 pardir = '..'
26 extsep = '.'
27 sep = '\\'
28 pathsep = ';'
29 altsep = '/'
30 defpath = '.;C:\\bin'
31 if 'ce' in sys.builtin_module_names:
32 defpath = '\\Windows'
33 elif 'os2' in sys.builtin_module_names:
34 # OS/2 w/ VACPP
35 altsep = '/'
36 devnull = 'nul'
38 # Normalize the case of a pathname and map slashes to backslashes.
39 # Other normalizations (such as optimizing '../' away) are not done
40 # (this is done by normpath).
42 def normcase(s):
43 """Normalize case of pathname.
45 Makes all characters lowercase and all slashes into backslashes."""
46 return s.replace("/", "\\").lower()
49 # Return whether a path is absolute.
50 # Trivial in Posix, harder on the Mac or MS-DOS.
51 # For DOS it is absolute if it starts with a slash or backslash (current
52 # volume), or if a pathname after the volume letter and colon / UNC resource
53 # starts with a slash or backslash.
55 def isabs(s):
56 """Test whether a path is absolute"""
57 s = splitdrive(s)[1]
58 return s != '' and s[:1] in '/\\'
61 # Join two (or more) paths.
63 def join(a, *p):
64 """Join two or more pathname components, inserting "\\" as needed.
65 If any component is an absolute path, all previous path components
66 will be discarded."""
67 path = a
68 for b in p:
69 b_wins = 0 # set to 1 iff b makes path irrelevant
70 if path == "":
71 b_wins = 1
73 elif isabs(b):
74 # This probably wipes out path so far. However, it's more
75 # complicated if path begins with a drive letter:
76 # 1. join('c:', '/a') == 'c:/a'
77 # 2. join('c:/', '/a') == 'c:/a'
78 # But
79 # 3. join('c:/a', '/b') == '/b'
80 # 4. join('c:', 'd:/') = 'd:/'
81 # 5. join('c:/', 'd:/') = 'd:/'
82 if path[1:2] != ":" or b[1:2] == ":":
83 # Path doesn't start with a drive letter, or cases 4 and 5.
84 b_wins = 1
86 # Else path has a drive letter, and b doesn't but is absolute.
87 elif len(path) > 3 or (len(path) == 3 and
88 path[-1] not in "/\\"):
89 # case 3
90 b_wins = 1
92 if b_wins:
93 path = b
94 else:
95 # Join, and ensure there's a separator.
96 assert len(path) > 0
97 if path[-1] in "/\\":
98 if b and b[0] in "/\\":
99 path += b[1:]
100 else:
101 path += b
102 elif path[-1] == ":":
103 path += b
104 elif b:
105 if b[0] in "/\\":
106 path += b
107 else:
108 path += "\\" + b
109 else:
110 # path is not empty and does not end with a backslash,
111 # but b is empty; since, e.g., split('a/') produces
112 # ('a', ''), it's best if join() adds a backslash in
113 # this case.
114 path += '\\'
116 return path
119 # Split a path in a drive specification (a drive letter followed by a
120 # colon) and the path specification.
121 # It is always true that drivespec + pathspec == p
122 def splitdrive(p):
123 """Split a pathname into drive and path specifiers. Returns a 2-tuple
124 "(drive,path)"; either part may be empty"""
125 if p[1:2] == ':':
126 return p[0:2], p[2:]
127 return '', p
130 # Parse UNC paths
131 def splitunc(p):
132 """Split a pathname into UNC mount point and relative path specifiers.
134 Return a 2-tuple (unc, rest); either part may be empty.
135 If unc is not empty, it has the form '//host/mount' (or similar
136 using backslashes). unc+rest is always the input path.
137 Paths containing drive letters never have an UNC part.
139 if p[1:2] == ':':
140 return '', p # Drive letter present
141 firstTwo = p[0:2]
142 if firstTwo == '//' or firstTwo == '\\\\':
143 # is a UNC path:
144 # vvvvvvvvvvvvvvvvvvvv equivalent to drive letter
145 # \\machine\mountpoint\directories...
146 # directory ^^^^^^^^^^^^^^^
147 normp = normcase(p)
148 index = normp.find('\\', 2)
149 if index == -1:
150 ##raise RuntimeError, 'illegal UNC path: "' + p + '"'
151 return ("", p)
152 index = normp.find('\\', index + 1)
153 if index == -1:
154 index = len(p)
155 return p[:index], p[index:]
156 return '', p
159 # Split a path in head (everything up to the last '/') and tail (the
160 # rest). After the trailing '/' is stripped, the invariant
161 # join(head, tail) == p holds.
162 # The resulting head won't end in '/' unless it is the root.
164 def split(p):
165 """Split a pathname.
167 Return tuple (head, tail) where tail is everything after the final slash.
168 Either part may be empty."""
170 d, p = splitdrive(p)
171 # set i to index beyond p's last slash
172 i = len(p)
173 while i and p[i-1] not in '/\\':
174 i = i - 1
175 head, tail = p[:i], p[i:] # now tail has no slashes
176 # remove trailing slashes from head, unless it's all slashes
177 head2 = head
178 while head2 and head2[-1] in '/\\':
179 head2 = head2[:-1]
180 head = head2 or head
181 return d + head, tail
184 # Split a path in root and extension.
185 # The extension is everything starting at the last dot in the last
186 # pathname component; the root is everything before that.
187 # It is always true that root + ext == p.
189 def splitext(p):
190 return genericpath._splitext(p, sep, altsep, extsep)
191 splitext.__doc__ = genericpath._splitext.__doc__
194 # Return the tail (basename) part of a path.
196 def basename(p):
197 """Returns the final component of a pathname"""
198 return split(p)[1]
201 # Return the head (dirname) part of a path.
203 def dirname(p):
204 """Returns the directory component of a pathname"""
205 return split(p)[0]
207 # Is a path a symbolic link?
208 # This will always return false on systems where posix.lstat doesn't exist.
210 def islink(path):
211 """Test for symbolic link.
212 On WindowsNT/95 and OS/2 always returns false
214 return False
216 # alias exists to lexists
217 lexists = exists
219 # Is a path a mount point? Either a root (with or without drive letter)
220 # or an UNC path with at most a / or \ after the mount point.
222 def ismount(path):
223 """Test whether a path is a mount point (defined as root of drive)"""
224 unc, rest = splitunc(path)
225 if unc:
226 return rest in ("", "/", "\\")
227 p = splitdrive(path)[1]
228 return len(p) == 1 and p[0] in '/\\'
231 # Directory tree walk.
232 # For each directory under top (including top itself, but excluding
233 # '.' and '..'), func(arg, dirname, filenames) is called, where
234 # dirname is the name of the directory and filenames is the list
235 # of files (and subdirectories etc.) in the directory.
236 # The func may modify the filenames list, to implement a filter,
237 # or to impose a different order of visiting.
239 def walk(top, func, arg):
240 """Directory tree walk with callback function.
242 For each directory in the directory tree rooted at top (including top
243 itself, but excluding '.' and '..'), call func(arg, dirname, fnames).
244 dirname is the name of the directory, and fnames a list of the names of
245 the files and subdirectories in dirname (excluding '.' and '..'). func
246 may modify the fnames list in-place (e.g. via del or slice assignment),
247 and walk will only recurse into the subdirectories whose names remain in
248 fnames; this can be used to implement a filter, or to impose a specific
249 order of visiting. No semantics are defined for, or required of, arg,
250 beyond that arg is always passed to func. It can be used, e.g., to pass
251 a filename pattern, or a mutable object designed to accumulate
252 statistics. Passing None for arg is common."""
253 warnings.warnpy3k("In 3.x, os.path.walk is removed in favor of os.walk.")
254 try:
255 names = os.listdir(top)
256 except os.error:
257 return
258 func(arg, top, names)
259 for name in names:
260 name = join(top, name)
261 if isdir(name):
262 walk(name, func, arg)
265 # Expand paths beginning with '~' or '~user'.
266 # '~' means $HOME; '~user' means that user's home directory.
267 # If the path doesn't begin with '~', or if the user or $HOME is unknown,
268 # the path is returned unchanged (leaving error reporting to whatever
269 # function is called with the expanded path as argument).
270 # See also module 'glob' for expansion of *, ? and [...] in pathnames.
271 # (A function should also be defined to do full *sh-style environment
272 # variable expansion.)
274 def expanduser(path):
275 """Expand ~ and ~user constructs.
277 If user or $HOME is unknown, do nothing."""
278 if path[:1] != '~':
279 return path
280 i, n = 1, len(path)
281 while i < n and path[i] not in '/\\':
282 i = i + 1
284 if 'HOME' in os.environ:
285 userhome = os.environ['HOME']
286 elif 'USERPROFILE' in os.environ:
287 userhome = os.environ['USERPROFILE']
288 elif not 'HOMEPATH' in os.environ:
289 return path
290 else:
291 try:
292 drive = os.environ['HOMEDRIVE']
293 except KeyError:
294 drive = ''
295 userhome = join(drive, os.environ['HOMEPATH'])
297 if i != 1: #~user
298 userhome = join(dirname(userhome), path[1:i])
300 return userhome + path[i:]
303 # Expand paths containing shell variable substitutions.
304 # The following rules apply:
305 # - no expansion within single quotes
306 # - '$$' is translated into '$'
307 # - '%%' is translated into '%' if '%%' are not seen in %var1%%var2%
308 # - ${varname} is accepted.
309 # - $varname is accepted.
310 # - %varname% is accepted.
311 # - varnames can be made out of letters, digits and the characters '_-'
312 # (though is not verifed in the ${varname} and %varname% cases)
313 # XXX With COMMAND.COM you can use any characters in a variable name,
314 # XXX except '^|<>='.
316 def expandvars(path):
317 """Expand shell variables of the forms $var, ${var} and %var%.
319 Unknown variables are left unchanged."""
320 if '$' not in path and '%' not in path:
321 return path
322 import string
323 varchars = string.ascii_letters + string.digits + '_-'
324 res = ''
325 index = 0
326 pathlen = len(path)
327 while index < pathlen:
328 c = path[index]
329 if c == '\'': # no expansion within single quotes
330 path = path[index + 1:]
331 pathlen = len(path)
332 try:
333 index = path.index('\'')
334 res = res + '\'' + path[:index + 1]
335 except ValueError:
336 res = res + path
337 index = pathlen - 1
338 elif c == '%': # variable or '%'
339 if path[index + 1:index + 2] == '%':
340 res = res + c
341 index = index + 1
342 else:
343 path = path[index+1:]
344 pathlen = len(path)
345 try:
346 index = path.index('%')
347 except ValueError:
348 res = res + '%' + path
349 index = pathlen - 1
350 else:
351 var = path[:index]
352 if var in os.environ:
353 res = res + os.environ[var]
354 else:
355 res = res + '%' + var + '%'
356 elif c == '$': # variable or '$$'
357 if path[index + 1:index + 2] == '$':
358 res = res + c
359 index = index + 1
360 elif path[index + 1:index + 2] == '{':
361 path = path[index+2:]
362 pathlen = len(path)
363 try:
364 index = path.index('}')
365 var = path[:index]
366 if var in os.environ:
367 res = res + os.environ[var]
368 else:
369 res = res + '${' + var + '}'
370 except ValueError:
371 res = res + '${' + path
372 index = pathlen - 1
373 else:
374 var = ''
375 index = index + 1
376 c = path[index:index + 1]
377 while c != '' and c in varchars:
378 var = var + c
379 index = index + 1
380 c = path[index:index + 1]
381 if var in os.environ:
382 res = res + os.environ[var]
383 else:
384 res = res + '$' + var
385 if c != '':
386 index = index - 1
387 else:
388 res = res + c
389 index = index + 1
390 return res
393 # Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A\B.
394 # Previously, this function also truncated pathnames to 8+3 format,
395 # but as this module is called "ntpath", that's obviously wrong!
397 def normpath(path):
398 """Normalize path, eliminating double slashes, etc."""
399 path = path.replace("/", "\\")
400 prefix, path = splitdrive(path)
401 # We need to be careful here. If the prefix is empty, and the path starts
402 # with a backslash, it could either be an absolute path on the current
403 # drive (\dir1\dir2\file) or a UNC filename (\\server\mount\dir1\file). It
404 # is therefore imperative NOT to collapse multiple backslashes blindly in
405 # that case.
406 # The code below preserves multiple backslashes when there is no drive
407 # letter. This means that the invalid filename \\\a\b is preserved
408 # unchanged, where a\\\b is normalised to a\b. It's not clear that there
409 # is any better behaviour for such edge cases.
410 if prefix == '':
411 # No drive letter - preserve initial backslashes
412 while path[:1] == "\\":
413 prefix = prefix + "\\"
414 path = path[1:]
415 else:
416 # We have a drive letter - collapse initial backslashes
417 if path.startswith("\\"):
418 prefix = prefix + "\\"
419 path = path.lstrip("\\")
420 comps = path.split("\\")
421 i = 0
422 while i < len(comps):
423 if comps[i] in ('.', ''):
424 del comps[i]
425 elif comps[i] == '..':
426 if i > 0 and comps[i-1] != '..':
427 del comps[i-1:i+1]
428 i -= 1
429 elif i == 0 and prefix.endswith("\\"):
430 del comps[i]
431 else:
432 i += 1
433 else:
434 i += 1
435 # If the path is now empty, substitute '.'
436 if not prefix and not comps:
437 comps.append('.')
438 return prefix + "\\".join(comps)
441 # Return an absolute path.
442 try:
443 from nt import _getfullpathname
445 except ImportError: # not running on Windows - mock up something sensible
446 def abspath(path):
447 """Return the absolute version of a path."""
448 if not isabs(path):
449 path = join(os.getcwd(), path)
450 return normpath(path)
452 else: # use native Windows method on Windows
453 def abspath(path):
454 """Return the absolute version of a path."""
456 if path: # Empty path must return current working directory.
457 try:
458 path = _getfullpathname(path)
459 except WindowsError:
460 pass # Bad path - return unchanged.
461 else:
462 path = os.getcwd()
463 return normpath(path)
465 # realpath is a no-op on systems without islink support
466 realpath = abspath
467 # Win9x family and earlier have no Unicode filename support.
468 supports_unicode_filenames = (hasattr(sys, "getwindowsversion") and
469 sys.getwindowsversion()[3] >= 2)
471 def relpath(path, start=curdir):
472 """Return a relative version of a path"""
474 if not path:
475 raise ValueError("no path specified")
476 start_list = abspath(start).split(sep)
477 path_list = abspath(path).split(sep)
478 if start_list[0].lower() != path_list[0].lower():
479 unc_path, rest = splitunc(path)
480 unc_start, rest = splitunc(start)
481 if bool(unc_path) ^ bool(unc_start):
482 raise ValueError("Cannot mix UNC and non-UNC paths (%s and %s)"
483 % (path, start))
484 else:
485 raise ValueError("path is on drive %s, start on drive %s"
486 % (path_list[0], start_list[0]))
487 # Work out how much of the filepath is shared by start and path.
488 for i in range(min(len(start_list), len(path_list))):
489 if start_list[i].lower() != path_list[i].lower():
490 break
491 else:
492 i += 1
494 rel_list = [pardir] * (len(start_list)-i) + path_list[i:]
495 if not rel_list:
496 return curdir
497 return join(*rel_list)