pathlib.py 46 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426
  1. import fnmatch
  2. import functools
  3. import io
  4. import ntpath
  5. import os
  6. import posixpath
  7. import re
  8. import sys
  9. from collections import Sequence
  10. from contextlib import contextmanager
  11. from errno import EINVAL, ENOENT, ENOTDIR
  12. from operator import attrgetter
  13. from stat import S_ISDIR, S_ISLNK, S_ISREG, S_ISSOCK, S_ISBLK, S_ISCHR, S_ISFIFO
  14. from urllib.parse import quote_from_bytes as urlquote_from_bytes
  15. supports_symlinks = True
  16. if os.name == 'nt':
  17. import nt
  18. if sys.getwindowsversion()[:2] >= (6, 0):
  19. from nt import _getfinalpathname
  20. else:
  21. supports_symlinks = False
  22. _getfinalpathname = None
  23. else:
  24. nt = None
  25. __all__ = [
  26. "PurePath", "PurePosixPath", "PureWindowsPath",
  27. "Path", "PosixPath", "WindowsPath",
  28. ]
  29. #
  30. # Internals
  31. #
  32. def _is_wildcard_pattern(pat):
  33. # Whether this pattern needs actual matching using fnmatch, or can
  34. # be looked up directly as a file.
  35. return "*" in pat or "?" in pat or "[" in pat
  36. class _Flavour(object):
  37. """A flavour implements a particular (platform-specific) set of path
  38. semantics."""
  39. def __init__(self):
  40. self.join = self.sep.join
  41. def parse_parts(self, parts):
  42. parsed = []
  43. sep = self.sep
  44. altsep = self.altsep
  45. drv = root = ''
  46. it = reversed(parts)
  47. for part in it:
  48. if not part:
  49. continue
  50. if altsep:
  51. part = part.replace(altsep, sep)
  52. drv, root, rel = self.splitroot(part)
  53. if sep in rel:
  54. for x in reversed(rel.split(sep)):
  55. if x and x != '.':
  56. parsed.append(sys.intern(x))
  57. else:
  58. if rel and rel != '.':
  59. parsed.append(sys.intern(rel))
  60. if drv or root:
  61. if not drv:
  62. # If no drive is present, try to find one in the previous
  63. # parts. This makes the result of parsing e.g.
  64. # ("C:", "/", "a") reasonably intuitive.
  65. for part in it:
  66. if not part:
  67. continue
  68. if altsep:
  69. part = part.replace(altsep, sep)
  70. drv = self.splitroot(part)[0]
  71. if drv:
  72. break
  73. break
  74. if drv or root:
  75. parsed.append(drv + root)
  76. parsed.reverse()
  77. return drv, root, parsed
  78. def join_parsed_parts(self, drv, root, parts, drv2, root2, parts2):
  79. """
  80. Join the two paths represented by the respective
  81. (drive, root, parts) tuples. Return a new (drive, root, parts) tuple.
  82. """
  83. if root2:
  84. if not drv2 and drv:
  85. return drv, root2, [drv + root2] + parts2[1:]
  86. elif drv2:
  87. if drv2 == drv or self.casefold(drv2) == self.casefold(drv):
  88. # Same drive => second path is relative to the first
  89. return drv, root, parts + parts2[1:]
  90. else:
  91. # Second path is non-anchored (common case)
  92. return drv, root, parts + parts2
  93. return drv2, root2, parts2
  94. class _WindowsFlavour(_Flavour):
  95. # Reference for Windows paths can be found at
  96. # http://msdn.microsoft.com/en-us/library/aa365247%28v=vs.85%29.aspx
  97. sep = '\\'
  98. altsep = '/'
  99. has_drv = True
  100. pathmod = ntpath
  101. is_supported = (os.name == 'nt')
  102. drive_letters = (
  103. set(chr(x) for x in range(ord('a'), ord('z') + 1)) |
  104. set(chr(x) for x in range(ord('A'), ord('Z') + 1))
  105. )
  106. ext_namespace_prefix = '\\\\?\\'
  107. reserved_names = (
  108. {'CON', 'PRN', 'AUX', 'NUL'} |
  109. {'COM%d' % i for i in range(1, 10)} |
  110. {'LPT%d' % i for i in range(1, 10)}
  111. )
  112. # Interesting findings about extended paths:
  113. # - '\\?\c:\a', '//?/c:\a' and '//?/c:/a' are all supported
  114. # but '\\?\c:/a' is not
  115. # - extended paths are always absolute; "relative" extended paths will
  116. # fail.
  117. def splitroot(self, part, sep=sep):
  118. first = part[0:1]
  119. second = part[1:2]
  120. if (second == sep and first == sep):
  121. # XXX extended paths should also disable the collapsing of "."
  122. # components (according to MSDN docs).
  123. prefix, part = self._split_extended_path(part)
  124. first = part[0:1]
  125. second = part[1:2]
  126. else:
  127. prefix = ''
  128. third = part[2:3]
  129. if (second == sep and first == sep and third != sep):
  130. # is a UNC path:
  131. # vvvvvvvvvvvvvvvvvvvvv root
  132. # \\machine\mountpoint\directory\etc\...
  133. # directory ^^^^^^^^^^^^^^
  134. index = part.find(sep, 2)
  135. if index != -1:
  136. index2 = part.find(sep, index + 1)
  137. # a UNC path can't have two slashes in a row
  138. # (after the initial two)
  139. if index2 != index + 1:
  140. if index2 == -1:
  141. index2 = len(part)
  142. if prefix:
  143. return prefix + part[1:index2], sep, part[index2+1:]
  144. else:
  145. return part[:index2], sep, part[index2+1:]
  146. drv = root = ''
  147. if second == ':' and first in self.drive_letters:
  148. drv = part[:2]
  149. part = part[2:]
  150. first = third
  151. if first == sep:
  152. root = first
  153. part = part.lstrip(sep)
  154. return prefix + drv, root, part
  155. def casefold(self, s):
  156. return s.lower()
  157. def casefold_parts(self, parts):
  158. return [p.lower() for p in parts]
  159. def resolve(self, path):
  160. s = str(path)
  161. if not s:
  162. return os.getcwd()
  163. if _getfinalpathname is not None:
  164. return self._ext_to_normal(_getfinalpathname(s))
  165. # Means fallback on absolute
  166. return None
  167. def _split_extended_path(self, s, ext_prefix=ext_namespace_prefix):
  168. prefix = ''
  169. if s.startswith(ext_prefix):
  170. prefix = s[:4]
  171. s = s[4:]
  172. if s.startswith('UNC\\'):
  173. prefix += s[:3]
  174. s = '\\' + s[3:]
  175. return prefix, s
  176. def _ext_to_normal(self, s):
  177. # Turn back an extended path into a normal DOS-like path
  178. return self._split_extended_path(s)[1]
  179. def is_reserved(self, parts):
  180. # NOTE: the rules for reserved names seem somewhat complicated
  181. # (e.g. r"..\NUL" is reserved but not r"foo\NUL").
  182. # We err on the side of caution and return True for paths which are
  183. # not considered reserved by Windows.
  184. if not parts:
  185. return False
  186. if parts[0].startswith('\\\\'):
  187. # UNC paths are never reserved
  188. return False
  189. return parts[-1].partition('.')[0].upper() in self.reserved_names
  190. def make_uri(self, path):
  191. # Under Windows, file URIs use the UTF-8 encoding.
  192. drive = path.drive
  193. if len(drive) == 2 and drive[1] == ':':
  194. # It's a path on a local drive => 'file:///c:/a/b'
  195. rest = path.as_posix()[2:].lstrip('/')
  196. return 'file:///%s/%s' % (
  197. drive, urlquote_from_bytes(rest.encode('utf-8')))
  198. else:
  199. # It's a path on a network drive => 'file://host/share/a/b'
  200. return 'file:' + urlquote_from_bytes(path.as_posix().encode('utf-8'))
  201. def gethomedir(self, username):
  202. if 'HOME' in os.environ:
  203. userhome = os.environ['HOME']
  204. elif 'USERPROFILE' in os.environ:
  205. userhome = os.environ['USERPROFILE']
  206. elif 'HOMEPATH' in os.environ:
  207. try:
  208. drv = os.environ['HOMEDRIVE']
  209. except KeyError:
  210. drv = ''
  211. userhome = drv + os.environ['HOMEPATH']
  212. else:
  213. raise RuntimeError("Can't determine home directory")
  214. if username:
  215. # Try to guess user home directory. By default all users
  216. # directories are located in the same place and are named by
  217. # corresponding usernames. If current user home directory points
  218. # to nonstandard place, this guess is likely wrong.
  219. if os.environ['USERNAME'] != username:
  220. drv, root, parts = self.parse_parts((userhome,))
  221. if parts[-1] != os.environ['USERNAME']:
  222. raise RuntimeError("Can't determine home directory "
  223. "for %r" % username)
  224. parts[-1] = username
  225. if drv or root:
  226. userhome = drv + root + self.join(parts[1:])
  227. else:
  228. userhome = self.join(parts)
  229. return userhome
  230. class _PosixFlavour(_Flavour):
  231. sep = '/'
  232. altsep = ''
  233. has_drv = False
  234. pathmod = posixpath
  235. is_supported = (os.name != 'nt')
  236. def splitroot(self, part, sep=sep):
  237. if part and part[0] == sep:
  238. stripped_part = part.lstrip(sep)
  239. # According to POSIX path resolution:
  240. # http://pubs.opengroup.org/onlinepubs/009695399/basedefs/xbd_chap04.html#tag_04_11
  241. # "A pathname that begins with two successive slashes may be
  242. # interpreted in an implementation-defined manner, although more
  243. # than two leading slashes shall be treated as a single slash".
  244. if len(part) - len(stripped_part) == 2:
  245. return '', sep * 2, stripped_part
  246. else:
  247. return '', sep, stripped_part
  248. else:
  249. return '', '', part
  250. def casefold(self, s):
  251. return s
  252. def casefold_parts(self, parts):
  253. return parts
  254. def resolve(self, path):
  255. sep = self.sep
  256. accessor = path._accessor
  257. seen = {}
  258. def _resolve(path, rest):
  259. if rest.startswith(sep):
  260. path = ''
  261. for name in rest.split(sep):
  262. if not name or name == '.':
  263. # current dir
  264. continue
  265. if name == '..':
  266. # parent dir
  267. path, _, _ = path.rpartition(sep)
  268. continue
  269. newpath = path + sep + name
  270. if newpath in seen:
  271. # Already seen this path
  272. path = seen[newpath]
  273. if path is not None:
  274. # use cached value
  275. continue
  276. # The symlink is not resolved, so we must have a symlink loop.
  277. raise RuntimeError("Symlink loop from %r" % newpath)
  278. # Resolve the symbolic link
  279. try:
  280. target = accessor.readlink(newpath)
  281. except OSError as e:
  282. if e.errno != EINVAL:
  283. raise
  284. # Not a symlink
  285. path = newpath
  286. else:
  287. seen[newpath] = None # not resolved symlink
  288. path = _resolve(path, target)
  289. seen[newpath] = path # resolved symlink
  290. return path
  291. # NOTE: according to POSIX, getcwd() cannot contain path components
  292. # which are symlinks.
  293. base = '' if path.is_absolute() else os.getcwd()
  294. return _resolve(base, str(path)) or sep
  295. def is_reserved(self, parts):
  296. return False
  297. def make_uri(self, path):
  298. # We represent the path using the local filesystem encoding,
  299. # for portability to other applications.
  300. bpath = bytes(path)
  301. return 'file://' + urlquote_from_bytes(bpath)
  302. def gethomedir(self, username):
  303. if not username:
  304. try:
  305. return os.environ['HOME']
  306. except KeyError:
  307. import pwd
  308. return pwd.getpwuid(os.getuid()).pw_dir
  309. else:
  310. import pwd
  311. try:
  312. return pwd.getpwnam(username).pw_dir
  313. except KeyError:
  314. raise RuntimeError("Can't determine home directory "
  315. "for %r" % username)
  316. _windows_flavour = _WindowsFlavour()
  317. _posix_flavour = _PosixFlavour()
  318. class _Accessor:
  319. """An accessor implements a particular (system-specific or not) way of
  320. accessing paths on the filesystem."""
  321. class _NormalAccessor(_Accessor):
  322. def _wrap_strfunc(strfunc):
  323. @functools.wraps(strfunc)
  324. def wrapped(pathobj, *args):
  325. return strfunc(str(pathobj), *args)
  326. return staticmethod(wrapped)
  327. def _wrap_binary_strfunc(strfunc):
  328. @functools.wraps(strfunc)
  329. def wrapped(pathobjA, pathobjB, *args):
  330. return strfunc(str(pathobjA), str(pathobjB), *args)
  331. return staticmethod(wrapped)
  332. stat = _wrap_strfunc(os.stat)
  333. lstat = _wrap_strfunc(os.lstat)
  334. open = _wrap_strfunc(os.open)
  335. listdir = _wrap_strfunc(os.listdir)
  336. chmod = _wrap_strfunc(os.chmod)
  337. if hasattr(os, "lchmod"):
  338. lchmod = _wrap_strfunc(os.lchmod)
  339. else:
  340. def lchmod(self, pathobj, mode):
  341. raise NotImplementedError("lchmod() not available on this system")
  342. mkdir = _wrap_strfunc(os.mkdir)
  343. unlink = _wrap_strfunc(os.unlink)
  344. rmdir = _wrap_strfunc(os.rmdir)
  345. rename = _wrap_binary_strfunc(os.rename)
  346. replace = _wrap_binary_strfunc(os.replace)
  347. if nt:
  348. if supports_symlinks:
  349. symlink = _wrap_binary_strfunc(os.symlink)
  350. else:
  351. def symlink(a, b, target_is_directory):
  352. raise NotImplementedError("symlink() not available on this system")
  353. else:
  354. # Under POSIX, os.symlink() takes two args
  355. @staticmethod
  356. def symlink(a, b, target_is_directory):
  357. return os.symlink(str(a), str(b))
  358. utime = _wrap_strfunc(os.utime)
  359. # Helper for resolve()
  360. def readlink(self, path):
  361. return os.readlink(path)
  362. _normal_accessor = _NormalAccessor()
  363. #
  364. # Globbing helpers
  365. #
  366. @contextmanager
  367. def _cached(func):
  368. try:
  369. func.__cached__
  370. yield func
  371. except AttributeError:
  372. cache = {}
  373. def wrapper(*args):
  374. try:
  375. return cache[args]
  376. except KeyError:
  377. value = cache[args] = func(*args)
  378. return value
  379. wrapper.__cached__ = True
  380. try:
  381. yield wrapper
  382. finally:
  383. cache.clear()
  384. def _make_selector(pattern_parts):
  385. pat = pattern_parts[0]
  386. child_parts = pattern_parts[1:]
  387. if pat == '**':
  388. cls = _RecursiveWildcardSelector
  389. elif '**' in pat:
  390. raise ValueError("Invalid pattern: '**' can only be an entire path component")
  391. elif _is_wildcard_pattern(pat):
  392. cls = _WildcardSelector
  393. else:
  394. cls = _PreciseSelector
  395. return cls(pat, child_parts)
  396. if hasattr(functools, "lru_cache"):
  397. _make_selector = functools.lru_cache()(_make_selector)
  398. class _Selector:
  399. """A selector matches a specific glob pattern part against the children
  400. of a given path."""
  401. def __init__(self, child_parts):
  402. self.child_parts = child_parts
  403. if child_parts:
  404. self.successor = _make_selector(child_parts)
  405. else:
  406. self.successor = _TerminatingSelector()
  407. def select_from(self, parent_path):
  408. """Iterate over all child paths of `parent_path` matched by this
  409. selector. This can contain parent_path itself."""
  410. path_cls = type(parent_path)
  411. is_dir = path_cls.is_dir
  412. exists = path_cls.exists
  413. listdir = parent_path._accessor.listdir
  414. return self._select_from(parent_path, is_dir, exists, listdir)
  415. class _TerminatingSelector:
  416. def _select_from(self, parent_path, is_dir, exists, listdir):
  417. yield parent_path
  418. class _PreciseSelector(_Selector):
  419. def __init__(self, name, child_parts):
  420. self.name = name
  421. _Selector.__init__(self, child_parts)
  422. def _select_from(self, parent_path, is_dir, exists, listdir):
  423. try:
  424. if not is_dir(parent_path):
  425. return
  426. path = parent_path._make_child_relpath(self.name)
  427. if exists(path):
  428. for p in self.successor._select_from(path, is_dir, exists, listdir):
  429. yield p
  430. except PermissionError:
  431. return
  432. class _WildcardSelector(_Selector):
  433. def __init__(self, pat, child_parts):
  434. self.pat = re.compile(fnmatch.translate(pat))
  435. _Selector.__init__(self, child_parts)
  436. def _select_from(self, parent_path, is_dir, exists, listdir):
  437. try:
  438. if not is_dir(parent_path):
  439. return
  440. cf = parent_path._flavour.casefold
  441. for name in listdir(parent_path):
  442. casefolded = cf(name)
  443. if self.pat.match(casefolded):
  444. path = parent_path._make_child_relpath(name)
  445. for p in self.successor._select_from(path, is_dir, exists, listdir):
  446. yield p
  447. except PermissionError:
  448. return
  449. class _RecursiveWildcardSelector(_Selector):
  450. def __init__(self, pat, child_parts):
  451. _Selector.__init__(self, child_parts)
  452. def _iterate_directories(self, parent_path, is_dir, listdir):
  453. yield parent_path
  454. try:
  455. for name in listdir(parent_path):
  456. path = parent_path._make_child_relpath(name)
  457. if is_dir(path) and not path.is_symlink():
  458. for p in self._iterate_directories(path, is_dir, listdir):
  459. yield p
  460. except PermissionError:
  461. return
  462. def _select_from(self, parent_path, is_dir, exists, listdir):
  463. try:
  464. if not is_dir(parent_path):
  465. return
  466. with _cached(listdir) as listdir:
  467. yielded = set()
  468. try:
  469. successor_select = self.successor._select_from
  470. for starting_point in self._iterate_directories(parent_path, is_dir, listdir):
  471. for p in successor_select(starting_point, is_dir, exists, listdir):
  472. if p not in yielded:
  473. yield p
  474. yielded.add(p)
  475. finally:
  476. yielded.clear()
  477. except PermissionError:
  478. return
  479. #
  480. # Public API
  481. #
  482. class _PathParents(Sequence):
  483. """This object provides sequence-like access to the logical ancestors
  484. of a path. Don't try to construct it yourself."""
  485. __slots__ = ('_pathcls', '_drv', '_root', '_parts')
  486. def __init__(self, path):
  487. # We don't store the instance to avoid reference cycles
  488. self._pathcls = type(path)
  489. self._drv = path._drv
  490. self._root = path._root
  491. self._parts = path._parts
  492. def __len__(self):
  493. if self._drv or self._root:
  494. return len(self._parts) - 1
  495. else:
  496. return len(self._parts)
  497. def __getitem__(self, idx):
  498. if idx < 0 or idx >= len(self):
  499. raise IndexError(idx)
  500. return self._pathcls._from_parsed_parts(self._drv, self._root,
  501. self._parts[:-idx - 1])
  502. def __repr__(self):
  503. return "<{}.parents>".format(self._pathcls.__name__)
  504. class PurePath(object):
  505. """PurePath represents a filesystem path and offers operations which
  506. don't imply any actual filesystem I/O. Depending on your system,
  507. instantiating a PurePath will return either a PurePosixPath or a
  508. PureWindowsPath object. You can also instantiate either of these classes
  509. directly, regardless of your system.
  510. """
  511. __slots__ = (
  512. '_drv', '_root', '_parts',
  513. '_str', '_hash', '_pparts', '_cached_cparts',
  514. )
  515. def __new__(cls, *args):
  516. """Construct a PurePath from one or several strings and or existing
  517. PurePath objects. The strings and path objects are combined so as
  518. to yield a canonicalized path, which is incorporated into the
  519. new PurePath object.
  520. """
  521. if cls is PurePath:
  522. cls = PureWindowsPath if os.name == 'nt' else PurePosixPath
  523. return cls._from_parts(args)
  524. def __reduce__(self):
  525. # Using the parts tuple helps share interned path parts
  526. # when pickling related paths.
  527. return (self.__class__, tuple(self._parts))
  528. @classmethod
  529. def _parse_args(cls, args):
  530. # This is useful when you don't want to create an instance, just
  531. # canonicalize some constructor arguments.
  532. parts = []
  533. for a in args:
  534. if isinstance(a, PurePath):
  535. parts += a._parts
  536. elif isinstance(a, str):
  537. # Force-cast str subclasses to str (issue #21127)
  538. parts.append(str(a))
  539. else:
  540. raise TypeError(
  541. "argument should be a path or str object, not %r"
  542. % type(a))
  543. return cls._flavour.parse_parts(parts)
  544. @classmethod
  545. def _from_parts(cls, args, init=True):
  546. # We need to call _parse_args on the instance, so as to get the
  547. # right flavour.
  548. self = object.__new__(cls)
  549. drv, root, parts = self._parse_args(args)
  550. self._drv = drv
  551. self._root = root
  552. self._parts = parts
  553. if init:
  554. self._init()
  555. return self
  556. @classmethod
  557. def _from_parsed_parts(cls, drv, root, parts, init=True):
  558. self = object.__new__(cls)
  559. self._drv = drv
  560. self._root = root
  561. self._parts = parts
  562. if init:
  563. self._init()
  564. return self
  565. @classmethod
  566. def _format_parsed_parts(cls, drv, root, parts):
  567. if drv or root:
  568. return drv + root + cls._flavour.join(parts[1:])
  569. else:
  570. return cls._flavour.join(parts)
  571. def _init(self):
  572. # Overridden in concrete Path
  573. pass
  574. def _make_child(self, args):
  575. drv, root, parts = self._parse_args(args)
  576. drv, root, parts = self._flavour.join_parsed_parts(
  577. self._drv, self._root, self._parts, drv, root, parts)
  578. return self._from_parsed_parts(drv, root, parts)
  579. def __str__(self):
  580. """Return the string representation of the path, suitable for
  581. passing to system calls."""
  582. try:
  583. return self._str
  584. except AttributeError:
  585. self._str = self._format_parsed_parts(self._drv, self._root,
  586. self._parts) or '.'
  587. return self._str
  588. def as_posix(self):
  589. """Return the string representation of the path with forward (/)
  590. slashes."""
  591. f = self._flavour
  592. return str(self).replace(f.sep, '/')
  593. def __bytes__(self):
  594. """Return the bytes representation of the path. This is only
  595. recommended to use under Unix."""
  596. return os.fsencode(str(self))
  597. def __repr__(self):
  598. return "{}({!r})".format(self.__class__.__name__, self.as_posix())
  599. def as_uri(self):
  600. """Return the path as a 'file' URI."""
  601. if not self.is_absolute():
  602. raise ValueError("relative path can't be expressed as a file URI")
  603. return self._flavour.make_uri(self)
  604. @property
  605. def _cparts(self):
  606. # Cached casefolded parts, for hashing and comparison
  607. try:
  608. return self._cached_cparts
  609. except AttributeError:
  610. self._cached_cparts = self._flavour.casefold_parts(self._parts)
  611. return self._cached_cparts
  612. def __eq__(self, other):
  613. if not isinstance(other, PurePath):
  614. return NotImplemented
  615. return self._cparts == other._cparts and self._flavour is other._flavour
  616. def __hash__(self):
  617. try:
  618. return self._hash
  619. except AttributeError:
  620. self._hash = hash(tuple(self._cparts))
  621. return self._hash
  622. def __lt__(self, other):
  623. if not isinstance(other, PurePath) or self._flavour is not other._flavour:
  624. return NotImplemented
  625. return self._cparts < other._cparts
  626. def __le__(self, other):
  627. if not isinstance(other, PurePath) or self._flavour is not other._flavour:
  628. return NotImplemented
  629. return self._cparts <= other._cparts
  630. def __gt__(self, other):
  631. if not isinstance(other, PurePath) or self._flavour is not other._flavour:
  632. return NotImplemented
  633. return self._cparts > other._cparts
  634. def __ge__(self, other):
  635. if not isinstance(other, PurePath) or self._flavour is not other._flavour:
  636. return NotImplemented
  637. return self._cparts >= other._cparts
  638. drive = property(attrgetter('_drv'),
  639. doc="""The drive prefix (letter or UNC path), if any.""")
  640. root = property(attrgetter('_root'),
  641. doc="""The root of the path, if any.""")
  642. @property
  643. def anchor(self):
  644. """The concatenation of the drive and root, or ''."""
  645. anchor = self._drv + self._root
  646. return anchor
  647. @property
  648. def name(self):
  649. """The final path component, if any."""
  650. parts = self._parts
  651. if len(parts) == (1 if (self._drv or self._root) else 0):
  652. return ''
  653. return parts[-1]
  654. @property
  655. def suffix(self):
  656. """The final component's last suffix, if any."""
  657. name = self.name
  658. i = name.rfind('.')
  659. if 0 < i < len(name) - 1:
  660. return name[i:]
  661. else:
  662. return ''
  663. @property
  664. def suffixes(self):
  665. """A list of the final component's suffixes, if any."""
  666. name = self.name
  667. if name.endswith('.'):
  668. return []
  669. name = name.lstrip('.')
  670. return ['.' + suffix for suffix in name.split('.')[1:]]
  671. @property
  672. def stem(self):
  673. """The final path component, minus its last suffix."""
  674. name = self.name
  675. i = name.rfind('.')
  676. if 0 < i < len(name) - 1:
  677. return name[:i]
  678. else:
  679. return name
  680. def with_name(self, name):
  681. """Return a new path with the file name changed."""
  682. if not self.name:
  683. raise ValueError("%r has an empty name" % (self,))
  684. drv, root, parts = self._flavour.parse_parts((name,))
  685. if (not name or name[-1] in [self._flavour.sep, self._flavour.altsep]
  686. or drv or root or len(parts) != 1):
  687. raise ValueError("Invalid name %r" % (name))
  688. return self._from_parsed_parts(self._drv, self._root,
  689. self._parts[:-1] + [name])
  690. def with_suffix(self, suffix):
  691. """Return a new path with the file suffix changed (or added, if none)."""
  692. # XXX if suffix is None, should the current suffix be removed?
  693. f = self._flavour
  694. if f.sep in suffix or f.altsep and f.altsep in suffix:
  695. raise ValueError("Invalid suffix %r" % (suffix))
  696. if suffix and not suffix.startswith('.') or suffix == '.':
  697. raise ValueError("Invalid suffix %r" % (suffix))
  698. name = self.name
  699. if not name:
  700. raise ValueError("%r has an empty name" % (self,))
  701. old_suffix = self.suffix
  702. if not old_suffix:
  703. name = name + suffix
  704. else:
  705. name = name[:-len(old_suffix)] + suffix
  706. return self._from_parsed_parts(self._drv, self._root,
  707. self._parts[:-1] + [name])
  708. def relative_to(self, *other):
  709. """Return the relative path to another path identified by the passed
  710. arguments. If the operation is not possible (because this is not
  711. a subpath of the other path), raise ValueError.
  712. """
  713. # For the purpose of this method, drive and root are considered
  714. # separate parts, i.e.:
  715. # Path('c:/').relative_to('c:') gives Path('/')
  716. # Path('c:/').relative_to('/') raise ValueError
  717. if not other:
  718. raise TypeError("need at least one argument")
  719. parts = self._parts
  720. drv = self._drv
  721. root = self._root
  722. if root:
  723. abs_parts = [drv, root] + parts[1:]
  724. else:
  725. abs_parts = parts
  726. to_drv, to_root, to_parts = self._parse_args(other)
  727. if to_root:
  728. to_abs_parts = [to_drv, to_root] + to_parts[1:]
  729. else:
  730. to_abs_parts = to_parts
  731. n = len(to_abs_parts)
  732. cf = self._flavour.casefold_parts
  733. if (root or drv) if n == 0 else cf(abs_parts[:n]) != cf(to_abs_parts):
  734. formatted = self._format_parsed_parts(to_drv, to_root, to_parts)
  735. raise ValueError("{!r} does not start with {!r}"
  736. .format(str(self), str(formatted)))
  737. return self._from_parsed_parts('', root if n == 1 else '',
  738. abs_parts[n:])
  739. @property
  740. def parts(self):
  741. """An object providing sequence-like access to the
  742. components in the filesystem path."""
  743. # We cache the tuple to avoid building a new one each time .parts
  744. # is accessed. XXX is this necessary?
  745. try:
  746. return self._pparts
  747. except AttributeError:
  748. self._pparts = tuple(self._parts)
  749. return self._pparts
  def joinpath(self, *args):
      """Join this path with the given arguments and return the new path.

      The result is a subpath when every argument is a relative path, or
      a totally different path when one of the arguments is anchored.
      """
      joined = self._make_child(args)
      return joined
  def __truediv__(self, key):
      """Implement ``self / key`` by building the child path for *key*.

      Returns NotImplemented when *key* is rejected with TypeError, so
      that Python can try the reflected operation on *key* before raising
      TypeError itself.
      """
      try:
          return self._make_child((key,))
      except TypeError:
          return NotImplemented
  def __rtruediv__(self, key):
      """Implement ``key / self`` by prepending *key* to this path's parts.

      Returns NotImplemented when building the path raises TypeError, so
      that Python reports the unsupported operand types itself.
      """
      try:
          return self._from_parts([key] + self._parts)
      except TypeError:
          return NotImplemented
  @property
  def parent(self):
      """The logical parent of the path."""
      drv, root, parts = self._drv, self._root, self._parts
      # A path made of a single part that carries a drive or root is its
      # own parent.
      at_anchor = len(parts) == 1 and (drv or root)
      if at_anchor:
          return self
      return self._from_parsed_parts(drv, root, parts[:-1])
  @property
  def parents(self):
      """A sequence of this path's logical parents."""
      ancestors = _PathParents(self)
      return ancestors
  def is_absolute(self):
      """Return True if the path is absolute.

      That means it has a root and, when the flavour uses drives, a drive
      as well.
      """
      has_root = bool(self._root)
      if has_root and self._flavour.has_drv:
          # Flavours with drives additionally need a drive to be absolute.
          return bool(self._drv)
      return has_root
  def is_reserved(self):
      """Return True if the path contains one of the special names
      reserved by the system, if any.

      The decision is delegated to the flavour's ``is_reserved``.
      """
      flavour = self._flavour
      return flavour.is_reserved(self._parts)
  def match(self, path_pattern):
      """
      Return True if this path matches the given pattern.

      The pattern is case-folded by the flavour and compared component
      by component, starting from the last one.  Raises ValueError when
      the pattern has no parts.
      """
      fold = self._flavour.casefold
      pattern_drv, pattern_root, pattern_parts = self._flavour.parse_parts(
          (fold(path_pattern),))
      if not pattern_parts:
          raise ValueError("empty pattern")
      if pattern_drv and pattern_drv != fold(self._drv):
          return False
      if pattern_root and pattern_root != fold(self._root):
          return False
      own_parts = self._cparts
      if pattern_drv or pattern_root:
          # An anchored pattern must cover the whole path; its first part
          # is dropped because drive and root were checked above.
          if len(pattern_parts) != len(own_parts):
              return False
          pattern_parts = pattern_parts[1:]
      elif len(pattern_parts) > len(own_parts):
          return False
      return all(
          fnmatch.fnmatchcase(component, glob_part)
          for component, glob_part in zip(reversed(own_parts),
                                          reversed(pattern_parts))
      )
  class PurePosixPath(PurePath):
      """PurePath subclass bound to ``_posix_flavour``."""
      # Empty __slots__: this subclass declares no attributes of its own.
      __slots__ = ()
      _flavour = _posix_flavour
  class PureWindowsPath(PurePath):
      """PurePath subclass bound to ``_windows_flavour``."""
      # Empty __slots__: this subclass declares no attributes of its own.
      __slots__ = ()
      _flavour = _windows_flavour
  814. # Filesystem-accessing classes
  class Path(PurePath):
      """PurePath subclass whose methods access the filesystem.

      Filesystem calls are routed through ``self._accessor``.
      ``self._closed`` is set once the path has been used as a context
      manager and exited; methods that check it then raise ValueError.
      """
      __slots__ = (
          '_accessor',
          '_closed',
      )

      def __new__(cls, *args, **kwargs):
          """Build a path from *args*.

          Instantiating ``Path`` itself selects ``WindowsPath`` when
          ``os.name == 'nt'`` and ``PosixPath`` otherwise.  Raises
          NotImplementedError when the selected flavour is not supported.
          """
          if cls is Path:
              cls = WindowsPath if os.name == 'nt' else PosixPath
          self = cls._from_parts(args, init=False)
          if not self._flavour.is_supported:
              raise NotImplementedError("cannot instantiate %r on your system"
                                        % (cls.__name__,))
          self._init()
          return self

      def _init(self,
                # Private non-constructor arguments
                template=None,
                ):
          """Set up the I/O state, reusing *template*'s accessor if given."""
          self._closed = False
          if template is not None:
              self._accessor = template._accessor
          else:
              self._accessor = _normal_accessor

      def _make_child_relpath(self, part):
          # This is an optimization used for dir walking.  `part` must be
          # a single part relative to this path.
          parts = self._parts + [part]
          return self._from_parsed_parts(self._drv, self._root, parts)

      def __enter__(self):
          """Enter the context; raise ValueError if already closed."""
          if self._closed:
              self._raise_closed()
          return self

      def __exit__(self, t, v, tb):
          """Mark the path as closed when leaving the context."""
          self._closed = True

      def _raise_closed(self):
          raise ValueError("I/O operation on closed path")

      def _opener(self, name, flags, mode=0o666):
          # A stub for the opener argument to built-in open().  `name` is
          # ignored: the accessor opens this path itself.
          return self._accessor.open(self, flags, mode)

      def _raw_open(self, flags, mode=0o777):
          """
          Open the file pointed by this path and return a file descriptor,
          as os.open() does.
          """
          if self._closed:
              self._raise_closed()
          return self._accessor.open(self, flags, mode)

      # Public API

      @classmethod
      def cwd(cls):
          """Return a new path pointing to the current working directory
          (as returned by os.getcwd()).
          """
          return cls(os.getcwd())

      @classmethod
      def home(cls):
          """Return a new path pointing to the user's home directory (as
          returned by os.path.expanduser('~')).
          """
          return cls(cls()._flavour.gethomedir(None))

      def samefile(self, other_path):
          """Return whether other_path is the same or not as this file
          (as returned by os.path.samefile()).
          """
          st = self.stat()
          try:
              other_st = other_path.stat()
          except AttributeError:
              # other_path has no stat() method; let os.stat() handle it.
              other_st = os.stat(other_path)
          return os.path.samestat(st, other_st)

      def iterdir(self):
          """Iterate over the files in this directory.  Does not yield any
          result for the special paths '.' and '..'.
          """
          if self._closed:
              self._raise_closed()
          for name in self._accessor.listdir(self):
              if name in {'.', '..'}:
                  # Yielding a path object for these makes little sense
                  continue
              yield self._make_child_relpath(name)
              # The path may have been closed while the consumer held the
              # previously yielded item.
              if self._closed:
                  self._raise_closed()

      def glob(self, pattern):
          """Iterate over this subtree and yield all existing files (of any
          kind, including directories) matching the given pattern.

          This is a generator, so the ValueError for an empty pattern and
          the NotImplementedError for an anchored pattern are raised when
          iteration starts.
          """
          if not pattern:
              raise ValueError("Unacceptable pattern: {!r}".format(pattern))
          pattern = self._flavour.casefold(pattern)
          drv, root, pattern_parts = self._flavour.parse_parts((pattern,))
          if drv or root:
              raise NotImplementedError("Non-relative patterns are unsupported")
          selector = _make_selector(tuple(pattern_parts))
          yield from selector.select_from(self)

      def rglob(self, pattern):
          """Recursively yield all existing files (of any kind, including
          directories) matching the given pattern, anywhere in this subtree.
          """
          pattern = self._flavour.casefold(pattern)
          drv, root, pattern_parts = self._flavour.parse_parts((pattern,))
          if drv or root:
              raise NotImplementedError("Non-relative patterns are unsupported")
          # Same as glob(), with a leading "**" component prepended.
          selector = _make_selector(("**",) + tuple(pattern_parts))
          yield from selector.select_from(self)

      def absolute(self):
          """Return an absolute version of this path.  This function works
          even if the path doesn't point to anything.

          No normalization is done, i.e. all '.' and '..' will be kept along.
          Use resolve() to get the canonical path to a file.
          """
          # XXX untested yet!
          if self._closed:
              self._raise_closed()
          if self.is_absolute():
              return self
          # FIXME this must defer to the specific flavour (and, under Windows,
          # use nt._getfullpathname())
          obj = self._from_parts([os.getcwd()] + self._parts, init=False)
          obj._init(template=self)
          return obj

      def resolve(self):
          """
          Make the path absolute, resolving all symlinks on the way and also
          normalizing it (for example turning slashes into backslashes under
          Windows).
          """
          if self._closed:
              self._raise_closed()
          s = self._flavour.resolve(self)
          if s is None:
              # No symlink resolution => for consistency, raise an error if
              # the path doesn't exist or is forbidden
              self.stat()
              s = str(self.absolute())
          # Now we have no symlinks in the path, it's safe to normalize it.
          normed = self._flavour.pathmod.normpath(s)
          obj = self._from_parts((normed,), init=False)
          obj._init(template=self)
          return obj

      def stat(self):
          """
          Return the result of the stat() system call on this path, like
          os.stat() does.
          """
          return self._accessor.stat(self)

      def owner(self):
          """
          Return the login name of the file owner.
          """
          # Imported here rather than at module level.
          import pwd
          return pwd.getpwuid(self.stat().st_uid).pw_name

      def group(self):
          """
          Return the group name of the file gid.
          """
          # Imported here rather than at module level.
          import grp
          return grp.getgrgid(self.stat().st_gid).gr_name

      def open(self, mode='r', buffering=-1, encoding=None,
               errors=None, newline=None):
          """
          Open the file pointed by this path and return a file object, as
          the built-in open() function does.
          """
          if self._closed:
              self._raise_closed()
          return io.open(str(self), mode, buffering, encoding, errors, newline,
                         opener=self._opener)

      def read_bytes(self):
          """
          Open the file in bytes mode, read it, and close the file.
          """
          with self.open(mode='rb') as f:
              return f.read()

      def read_text(self, encoding=None, errors=None):
          """
          Open the file in text mode, read it, and close the file.
          """
          with self.open(mode='r', encoding=encoding, errors=errors) as f:
              return f.read()

      def write_bytes(self, data):
          """
          Open the file in bytes mode, write to it, and close the file.

          Returns the value returned by the file object's write().
          """
          # type-check for the buffer interface before truncating the file
          view = memoryview(data)
          with self.open(mode='wb') as f:
              return f.write(view)

      def write_text(self, data, encoding=None, errors=None):
          """
          Open the file in text mode, write to it, and close the file.

          Raises TypeError if *data* is not a str.  Returns the value
          returned by the file object's write().
          """
          if not isinstance(data, str):
              raise TypeError('data must be str, not %s' %
                              data.__class__.__name__)
          with self.open(mode='w', encoding=encoding, errors=errors) as f:
              return f.write(data)

      def touch(self, mode=0o666, exist_ok=True):
          """
          Create this file with the given access mode, if it doesn't exist.
          """
          if self._closed:
              self._raise_closed()
          if exist_ok:
              # First try to bump modification time
              # Implementation note: GNU touch uses the UTIME_NOW option of
              # the utimensat() / futimens() functions.
              try:
                  self._accessor.utime(self, None)
              except OSError:
                  # Avoid exception chaining
                  pass
              else:
                  return
          flags = os.O_CREAT | os.O_WRONLY
          if not exist_ok:
              # O_EXCL makes the open fail if the file already exists.
              flags |= os.O_EXCL
          fd = self._raw_open(flags, mode)
          os.close(fd)

      def mkdir(self, mode=0o777, parents=False, exist_ok=False):
          """
          Create a new directory at this path.

          With parents=True, missing ancestors are created first, using
          the default mode rather than *mode*.  With exist_ok=True,
          FileExistsError is suppressed when the path already is a
          directory.
          """
          if self._closed:
              self._raise_closed()
          try:
              self._accessor.mkdir(self, mode)
          except FileExistsError:
              if not exist_ok or not self.is_dir():
                  raise
          except OSError as e:
              # Only a missing ancestor (ENOENT) is recoverable, and only
              # when parents were requested.  Stop at the anchor, whose
              # parent is itself, to avoid endless recursion.
              if not parents or e.errno != ENOENT or self.parent == self:
                  raise
              # exist_ok=True: an ancestor created concurrently is fine.
              self.parent.mkdir(parents=True, exist_ok=True)
              # Retry through mkdir() so exist_ok is honoured if the target
              # itself appeared in the meantime.
              self.mkdir(mode, parents=False, exist_ok=exist_ok)

      def chmod(self, mode):
          """
          Change the permissions of the path, like os.chmod().
          """
          if self._closed:
              self._raise_closed()
          self._accessor.chmod(self, mode)

      def lchmod(self, mode):
          """
          Like chmod(), except if the path points to a symlink, the symlink's
          permissions are changed, rather than its target's.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.lchmod(self, mode)

      def unlink(self):
          """
          Remove this file or link.
          If the path is a directory, use rmdir() instead.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.unlink(self)

      def rmdir(self):
          """
          Remove this directory.  The directory must be empty.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.rmdir(self)

      def lstat(self):
          """
          Like stat(), except if the path points to a symlink, the symlink's
          status information is returned, rather than its target's.
          """
          if self._closed:
              self._raise_closed()
          return self._accessor.lstat(self)

      def rename(self, target):
          """
          Rename this path to the given path.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.rename(self, target)

      def replace(self, target):
          """
          Rename this path to the given path, clobbering the existing
          destination if it exists.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.replace(self, target)

      def symlink_to(self, target, target_is_directory=False):
          """
          Make this path a symlink pointing to the given path.
          Note the order of arguments (self, target) is the reverse of os.symlink's.
          """
          if self._closed:
              self._raise_closed()
          self._accessor.symlink(target, self, target_is_directory)

      # Convenience functions for querying the stat results

      def exists(self):
          """
          Whether this path exists.
          """
          try:
              self.stat()
          except OSError as e:
              # ENOENT / ENOTDIR mean "not there"; anything else propagates.
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              return False
          return True

      def is_dir(self):
          """
          Whether this path is a directory.
          """
          try:
              return S_ISDIR(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def is_file(self):
          """
          Whether this path is a regular file (also True for symlinks pointing
          to regular files).
          """
          try:
              return S_ISREG(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def is_symlink(self):
          """
          Whether this path is a symbolic link.
          """
          try:
              # lstat(), not stat(): the link itself is inspected.
              return S_ISLNK(self.lstat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist
              return False

      def is_block_device(self):
          """
          Whether this path is a block device.
          """
          try:
              return S_ISBLK(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def is_char_device(self):
          """
          Whether this path is a character device.
          """
          try:
              return S_ISCHR(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def is_fifo(self):
          """
          Whether this path is a FIFO.
          """
          try:
              return S_ISFIFO(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def is_socket(self):
          """
          Whether this path is a socket.
          """
          try:
              return S_ISSOCK(self.stat().st_mode)
          except OSError as e:
              if e.errno not in (ENOENT, ENOTDIR):
                  raise
              # Path doesn't exist or is a broken symlink
              # (see https://bitbucket.org/pitrou/pathlib/issue/12/)
              return False

      def expanduser(self):
          """ Return a new path with expanded ~ and ~user constructs
          (as returned by os.path.expanduser)
          """
          # Only an unanchored path whose first part starts with '~' is
          # expanded; anything else is returned unchanged.
          if (not (self._drv or self._root) and
                  self._parts and self._parts[0][:1] == '~'):
              homedir = self._flavour.gethomedir(self._parts[0][1:])
              return self._from_parts([homedir] + self._parts[1:])

          return self
  class PosixPath(Path, PurePosixPath):
      """Path subclass combining ``Path`` with ``PurePosixPath``."""
      # Empty __slots__: this subclass declares no attributes of its own.
      __slots__ = ()
  class WindowsPath(Path, PureWindowsPath):
      """Path subclass combining ``Path`` with ``PureWindowsPath``.

      ``owner()`` and ``group()`` are overridden to raise
      NotImplementedError.
      """
      # Empty __slots__: this subclass declares no attributes of its own.
      __slots__ = ()

      def owner(self):
          """Always raise NotImplementedError."""
          message = "Path.owner() is unsupported on this system"
          raise NotImplementedError(message)

      def group(self):
          """Always raise NotImplementedError."""
          message = "Path.group() is unsupported on this system"
          raise NotImplementedError(message)