Patrick Williams | c124f4f | 2015-09-15 14:41:29 -0500 | [diff] [blame^] | 1 | # |
| 2 | # Based on standard python library functions but avoid |
| 3 | # repeated stat calls. It's assumed the files will not change from under us |
| 4 | # so we can cache stat calls. |
| 5 | # |
| 6 | |
| 7 | import os |
| 8 | import errno |
| 9 | import stat as statmod |
| 10 | |
class CachedPath(object):
    """os.path-style queries that remember stat()/lstat() results.

    Every lookup is keyed by the normalised path and kept for the lifetime
    of the instance; failed lookups are remembered as False.  Files are
    assumed not to change underneath the cache: call updatecache() for a
    path after modifying it.
    """

    def __init__(self):
        # normalised path -> os.stat() result, or False if the call failed
        self.statcache = {}
        # normalised path -> os.lstat() result, or False if the call failed
        self.lstatcache = {}
        # path as given -> os.path.normpath(path)
        self.normpathcache = {}

    def updatecache(self, x):
        """Drop any cached stat()/lstat() result for path x."""
        x = self.normpath(x)
        self.statcache.pop(x, None)
        self.lstatcache.pop(x, None)

    def normpath(self, path):
        """Return os.path.normpath(path), remembering the answer."""
        if path in self.normpathcache:
            return self.normpathcache[path]
        newpath = os.path.normpath(path)
        self.normpathcache[path] = newpath
        return newpath

    def _callstat(self, path):
        """Return the cached os.stat() result for an already normalised
        path, performing the call on a cache miss.  A failing call is
        cached and returned as False."""
        if path in self.statcache:
            return self.statcache[path]
        try:
            st = os.stat(path)
        except OSError:
            st = False
        self.statcache[path] = st
        return st

    # We might as well call lstat and then only
    # call stat as well in the symbolic link case
    # since this turns out to be much more optimal
    # in real world usage of this cache
    def callstat(self, path):
        """Return the os.stat() result for path (following symlinks), or
        False if the path cannot be stat'ed."""
        path = self.normpath(path)
        self.calllstat(path)
        if path not in self.statcache:
            # calllstat() normally fills both caches, but an lstat entry
            # can exist without its stat twin (e.g. a lookup that was
            # interrupted between the two stores); recover instead of
            # failing with KeyError.
            self._callstat(path)
        return self.statcache[path]

    def calllstat(self, path):
        """Return the os.lstat() result for path (not following symlinks),
        or False if the call fails.  The stat cache is filled as well: with
        the same result for non-links, via os.stat() for symlinks."""
        path = self.normpath(path)
        if path in self.lstatcache:
            return self.lstatcache[path]
        try:
            lst = os.lstat(path)
            self.lstatcache[path] = lst
            if not statmod.S_ISLNK(lst.st_mode):
                # Not a link: stat() and lstat() agree, reuse the result.
                self.statcache[path] = lst
            else:
                self._callstat(path)
            return lst
        except (OSError, AttributeError):
            self.lstatcache[path] = False
            self.statcache[path] = False
            return False

    # This follows symbolic links, so both islink() and isfile() can be true
    # for the same path on systems that support symlinks
    def isfile(self, path):
        """Test whether a path is a regular file"""
        st = self.callstat(path)
        if not st:
            return False
        return statmod.S_ISREG(st.st_mode)

    # Is a path a directory?
    # This follows symbolic links, so both islink() and isdir()
    # can be true for the same path on systems that support symlinks
    def isdir(self, s):
        """Return true if the pathname refers to an existing directory."""
        st = self.callstat(s)
        if not st:
            return False
        return statmod.S_ISDIR(st.st_mode)

    def islink(self, path):
        """Test whether a path is a symbolic link"""
        st = self.calllstat(path)
        if not st:
            return False
        return statmod.S_ISLNK(st.st_mode)

    # Does a path exist?
    # This is false for dangling symbolic links on systems that support them.
    def exists(self, path):
        """Test whether a path exists.  Returns False for broken symbolic links"""
        return bool(self.callstat(path))

    def lexists(self, path):
        """Test whether a path exists.  Returns True for broken symbolic links"""
        return bool(self.calllstat(path))

    def stat(self, path):
        """Cached os.stat(): the stat result, or False on failure."""
        return self.callstat(path)

    def lstat(self, path):
        """Cached os.lstat(): the lstat result, or False on failure."""
        return self.calllstat(path)

    def walk(self, top, topdown=True, onerror=None, followlinks=False):
        """Generate (dirpath, dirnames, filenames) tuples for the tree
        rooted at top, classifying entries through the stat cache.

        Matches os.walk, not os.path.walk().  With topdown set, a directory
        is yielded before its subdirectories, otherwise after them.
        Symlinked directories are listed in dirnames but only descended
        into when followlinks is set.  A failing os.listdir() is passed to
        onerror (if given) and that directory is skipped.
        """
        # We may not have read permission for top, in which case we can't
        # get a list of the files the directory contains.  os.path.walk
        # always suppressed the exception then, rather than blow up for a
        # minor reason when (say) a thousand readable directories are still
        # left to visit.  That logic is copied here.
        try:
            names = os.listdir(top)
        except OSError as err:
            if onerror is not None:
                onerror(err)
            return

        dirs, nondirs = [], []
        for name in names:
            if self.isdir(os.path.join(top, name)):
                dirs.append(name)
            else:
                nondirs.append(name)

        if topdown:
            yield top, dirs, nondirs
        # dirs is iterated after the top-down yield, so the consumer may
        # edit the list it received to prune the walk.
        for name in dirs:
            new_path = os.path.join(top, name)
            if followlinks or not self.islink(new_path):
                for x in self.walk(new_path, topdown, onerror, followlinks):
                    yield x
        if not topdown:
            yield top, dirs, nondirs

    ## realpath() related functions
    def __is_path_below(self, file, root):
        """Return True if file, with a separator appended, starts with
        root.  realpath() always passes a root that ends in a separator."""
        return (file + os.path.sep).startswith(root)

    def __realpath_rel(self, start, rel_path, root, loop_cnt, assume_dir):
        """Calculates real path of symlink 'start' + 'rel_path' below
        'root'; no part of 'start' below 'root' must contain symlinks.

        Raises OSError(ENOENT) when a component follows something that is
        not a directory, unless 'assume_dir' is set."""
        have_dir = True

        for d in rel_path.split(os.path.sep):
            if not have_dir and not assume_dir:
                raise OSError(errno.ENOENT, "no such directory %s" % start)

            if d == os.path.pardir:  # '..'
                if len(start) >= len(root):
                    # do not follow '..' before root
                    start = os.path.dirname(start)
                else:
                    # emit warning?
                    pass
            else:
                (start, have_dir) = self.__realpath(os.path.join(start, d),
                                                    root, loop_cnt, assume_dir)

            assert(self.__is_path_below(start, root))

        return start

    def __realpath(self, file, root, loop_cnt, assume_dir):
        """Resolve 'file' while it is a symlink, keeping the result below
        'root'.  Returns (resolved path, whether it is a directory).

        Raises OSError(ELOOP) once 'loop_cnt' links have been followed."""
        while self.islink(file) and len(file) >= len(root):
            if loop_cnt == 0:
                raise OSError(errno.ELOOP, file)

            loop_cnt -= 1
            target = os.path.normpath(os.readlink(file))

            if not os.path.isabs(target):
                tdir = os.path.dirname(file)
                assert(self.__is_path_below(tdir, root))
            else:
                # Absolute link targets are interpreted relative to root.
                tdir = root

            file = self.__realpath_rel(tdir, target, root, loop_cnt, assume_dir)

        try:
            is_dir = self.isdir(file)
        except Exception:
            # Best effort: an unclassifiable path is treated as a
            # non-directory.  Deliberately not a bare except, so that
            # KeyboardInterrupt and SystemExit still propagate.
            is_dir = False

        return (file, is_dir)

    def realpath(self, file, root, use_physdir=True, loop_cnt=100, assume_dir=False):
        """ Returns the canonical path of 'file' with assuming a
        toplevel 'root' directory. When 'use_physdir' is set, all
        preceding path components of 'file' will be resolved first;
        this flag should be set unless it is guaranteed that there is
        no symlink in the path. When 'assume_dir' is not set, missing
        path components will raise an ENOENT error.

        Raises OSError with EINVAL if 'file' is not below 'root' and with
        ELOOP if more than 'loop_cnt' symlinks had to be followed."""

        root = os.path.normpath(root)
        file = os.path.normpath(file)

        if not root.endswith(os.path.sep):
            # letting root end with '/' makes some things easier
            root = root + os.path.sep

        if not self.__is_path_below(file, root):
            raise OSError(errno.EINVAL, "file '%s' is not below root" % file)

        try:
            if use_physdir:
                # Keep the separator in front of the relative part; the
                # resulting empty first component resolves to root itself.
                file = self.__realpath_rel(root, file[(len(root) - 1):], root, loop_cnt, assume_dir)
            else:
                file = self.__realpath(file, root, loop_cnt, assume_dir)[0]
        except OSError as e:
            if e.errno == errno.ELOOP:
                # make ELOOP more readable; without catching it, there will
                # be printed a backtrace with 100s of OSError exceptions
                # else
                raise OSError(errno.ELOOP,
                              "too much recursions while resolving '%s'; loop in '%s'" %
                              (file, e.strerror))

            raise

        return file