Mercurial > repos > guerler > springsuite
comparison planemo/lib/python3.7/site-packages/distlib/util.py @ 0:d30785e31577 draft
"planemo upload commit 6eee67778febed82ddd413c3ca40b3183a3898f1"
author | guerler |
---|---|
date | Fri, 31 Jul 2020 00:18:57 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:d30785e31577 |
---|---|
1 # | |
2 # Copyright (C) 2012-2017 The Python Software Foundation. | |
3 # See LICENSE.txt and CONTRIBUTORS.txt. | |
4 # | |
5 import codecs | |
6 from collections import deque | |
7 import contextlib | |
8 import csv | |
9 from glob import iglob as std_iglob | |
10 import io | |
11 import json | |
12 import logging | |
13 import os | |
14 import py_compile | |
15 import re | |
16 import socket | |
17 try: | |
18 import ssl | |
19 except ImportError: # pragma: no cover | |
20 ssl = None | |
21 import subprocess | |
22 import sys | |
23 import tarfile | |
24 import tempfile | |
25 import textwrap | |
26 | |
27 try: | |
28 import threading | |
29 except ImportError: # pragma: no cover | |
30 import dummy_threading as threading | |
31 import time | |
32 | |
33 from . import DistlibException | |
34 from .compat import (string_types, text_type, shutil, raw_input, StringIO, | |
35 cache_from_source, urlopen, urljoin, httplib, xmlrpclib, | |
36 splittype, HTTPHandler, BaseConfigurator, valid_ident, | |
37 Container, configparser, URLError, ZipFile, fsdecode, | |
38 unquote, urlparse) | |
39 | |
40 logger = logging.getLogger(__name__) | |
41 | |
42 # | |
43 # Requirement parsing code as per PEP 508 | |
44 # | |
45 | |
46 IDENTIFIER = re.compile(r'^([\w\.-]+)\s*') | |
47 VERSION_IDENTIFIER = re.compile(r'^([\w\.*+-]+)\s*') | |
48 COMPARE_OP = re.compile(r'^(<=?|>=?|={2,3}|[~!]=)\s*') | |
49 MARKER_OP = re.compile(r'^((<=?)|(>=?)|={2,3}|[~!]=|in|not\s+in)\s*') | |
50 OR = re.compile(r'^or\b\s*') | |
51 AND = re.compile(r'^and\b\s*') | |
52 NON_SPACE = re.compile(r'(\S+)\s*') | |
53 STRING_CHUNK = re.compile(r'([\s\w\.{}()*+#:;,/?!~`@$%^&=|<>\[\]-]+)') | |
54 | |
55 | |
56 def parse_marker(marker_string): | |
57 """ | |
58 Parse a marker string and return a dictionary containing a marker expression. | |
59 | |
60 The dictionary will contain keys "op", "lhs" and "rhs" for non-terminals in | |
61 the expression grammar, or strings. A string contained in quotes is to be | |
62 interpreted as a literal string, and a string not contained in quotes is a | |
63 variable (such as os_name). | |
64 """ | |
65 def marker_var(remaining): | |
66 # either identifier, or literal string | |
67 m = IDENTIFIER.match(remaining) | |
68 if m: | |
69 result = m.groups()[0] | |
70 remaining = remaining[m.end():] | |
71 elif not remaining: | |
72 raise SyntaxError('unexpected end of input') | |
73 else: | |
74 q = remaining[0] | |
75 if q not in '\'"': | |
76 raise SyntaxError('invalid expression: %s' % remaining) | |
77 oq = '\'"'.replace(q, '') | |
78 remaining = remaining[1:] | |
79 parts = [q] | |
80 while remaining: | |
81 # either a string chunk, or oq, or q to terminate | |
82 if remaining[0] == q: | |
83 break | |
84 elif remaining[0] == oq: | |
85 parts.append(oq) | |
86 remaining = remaining[1:] | |
87 else: | |
88 m = STRING_CHUNK.match(remaining) | |
89 if not m: | |
90 raise SyntaxError('error in string literal: %s' % remaining) | |
91 parts.append(m.groups()[0]) | |
92 remaining = remaining[m.end():] | |
93 else: | |
94 s = ''.join(parts) | |
95 raise SyntaxError('unterminated string: %s' % s) | |
96 parts.append(q) | |
97 result = ''.join(parts) | |
98 remaining = remaining[1:].lstrip() # skip past closing quote | |
99 return result, remaining | |
100 | |
101 def marker_expr(remaining): | |
102 if remaining and remaining[0] == '(': | |
103 result, remaining = marker(remaining[1:].lstrip()) | |
104 if remaining[0] != ')': | |
105 raise SyntaxError('unterminated parenthesis: %s' % remaining) | |
106 remaining = remaining[1:].lstrip() | |
107 else: | |
108 lhs, remaining = marker_var(remaining) | |
109 while remaining: | |
110 m = MARKER_OP.match(remaining) | |
111 if not m: | |
112 break | |
113 op = m.groups()[0] | |
114 remaining = remaining[m.end():] | |
115 rhs, remaining = marker_var(remaining) | |
116 lhs = {'op': op, 'lhs': lhs, 'rhs': rhs} | |
117 result = lhs | |
118 return result, remaining | |
119 | |
120 def marker_and(remaining): | |
121 lhs, remaining = marker_expr(remaining) | |
122 while remaining: | |
123 m = AND.match(remaining) | |
124 if not m: | |
125 break | |
126 remaining = remaining[m.end():] | |
127 rhs, remaining = marker_expr(remaining) | |
128 lhs = {'op': 'and', 'lhs': lhs, 'rhs': rhs} | |
129 return lhs, remaining | |
130 | |
131 def marker(remaining): | |
132 lhs, remaining = marker_and(remaining) | |
133 while remaining: | |
134 m = OR.match(remaining) | |
135 if not m: | |
136 break | |
137 remaining = remaining[m.end():] | |
138 rhs, remaining = marker_and(remaining) | |
139 lhs = {'op': 'or', 'lhs': lhs, 'rhs': rhs} | |
140 return lhs, remaining | |
141 | |
142 return marker(marker_string) | |
143 | |
144 | |
145 def parse_requirement(req): | |
146 """ | |
147 Parse a requirement passed in as a string. Return a Container | |
148 whose attributes contain the various parts of the requirement. | |
149 """ | |
150 remaining = req.strip() | |
151 if not remaining or remaining.startswith('#'): | |
152 return None | |
153 m = IDENTIFIER.match(remaining) | |
154 if not m: | |
155 raise SyntaxError('name expected: %s' % remaining) | |
156 distname = m.groups()[0] | |
157 remaining = remaining[m.end():] | |
158 extras = mark_expr = versions = uri = None | |
159 if remaining and remaining[0] == '[': | |
160 i = remaining.find(']', 1) | |
161 if i < 0: | |
162 raise SyntaxError('unterminated extra: %s' % remaining) | |
163 s = remaining[1:i] | |
164 remaining = remaining[i + 1:].lstrip() | |
165 extras = [] | |
166 while s: | |
167 m = IDENTIFIER.match(s) | |
168 if not m: | |
169 raise SyntaxError('malformed extra: %s' % s) | |
170 extras.append(m.groups()[0]) | |
171 s = s[m.end():] | |
172 if not s: | |
173 break | |
174 if s[0] != ',': | |
175 raise SyntaxError('comma expected in extras: %s' % s) | |
176 s = s[1:].lstrip() | |
177 if not extras: | |
178 extras = None | |
179 if remaining: | |
180 if remaining[0] == '@': | |
181 # it's a URI | |
182 remaining = remaining[1:].lstrip() | |
183 m = NON_SPACE.match(remaining) | |
184 if not m: | |
185 raise SyntaxError('invalid URI: %s' % remaining) | |
186 uri = m.groups()[0] | |
187 t = urlparse(uri) | |
188 # there are issues with Python and URL parsing, so this test | |
189 # is a bit crude. See bpo-20271, bpo-23505. Python doesn't | |
190 # always parse invalid URLs correctly - it should raise | |
191 # exceptions for malformed URLs | |
192 if not (t.scheme and t.netloc): | |
193 raise SyntaxError('Invalid URL: %s' % uri) | |
194 remaining = remaining[m.end():].lstrip() | |
195 else: | |
196 | |
197 def get_versions(ver_remaining): | |
198 """ | |
199 Return a list of operator, version tuples if any are | |
200 specified, else None. | |
201 """ | |
202 m = COMPARE_OP.match(ver_remaining) | |
203 versions = None | |
204 if m: | |
205 versions = [] | |
206 while True: | |
207 op = m.groups()[0] | |
208 ver_remaining = ver_remaining[m.end():] | |
209 m = VERSION_IDENTIFIER.match(ver_remaining) | |
210 if not m: | |
211 raise SyntaxError('invalid version: %s' % ver_remaining) | |
212 v = m.groups()[0] | |
213 versions.append((op, v)) | |
214 ver_remaining = ver_remaining[m.end():] | |
215 if not ver_remaining or ver_remaining[0] != ',': | |
216 break | |
217 ver_remaining = ver_remaining[1:].lstrip() | |
218 m = COMPARE_OP.match(ver_remaining) | |
219 if not m: | |
220 raise SyntaxError('invalid constraint: %s' % ver_remaining) | |
221 if not versions: | |
222 versions = None | |
223 return versions, ver_remaining | |
224 | |
225 if remaining[0] != '(': | |
226 versions, remaining = get_versions(remaining) | |
227 else: | |
228 i = remaining.find(')', 1) | |
229 if i < 0: | |
230 raise SyntaxError('unterminated parenthesis: %s' % remaining) | |
231 s = remaining[1:i] | |
232 remaining = remaining[i + 1:].lstrip() | |
233 # As a special diversion from PEP 508, allow a version number | |
234 # a.b.c in parentheses as a synonym for ~= a.b.c (because this | |
235 # is allowed in earlier PEPs) | |
236 if COMPARE_OP.match(s): | |
237 versions, _ = get_versions(s) | |
238 else: | |
239 m = VERSION_IDENTIFIER.match(s) | |
240 if not m: | |
241 raise SyntaxError('invalid constraint: %s' % s) | |
242 v = m.groups()[0] | |
243 s = s[m.end():].lstrip() | |
244 if s: | |
245 raise SyntaxError('invalid constraint: %s' % s) | |
246 versions = [('~=', v)] | |
247 | |
248 if remaining: | |
249 if remaining[0] != ';': | |
250 raise SyntaxError('invalid requirement: %s' % remaining) | |
251 remaining = remaining[1:].lstrip() | |
252 | |
253 mark_expr, remaining = parse_marker(remaining) | |
254 | |
255 if remaining and remaining[0] != '#': | |
256 raise SyntaxError('unexpected trailing data: %s' % remaining) | |
257 | |
258 if not versions: | |
259 rs = distname | |
260 else: | |
261 rs = '%s %s' % (distname, ', '.join(['%s %s' % con for con in versions])) | |
262 return Container(name=distname, extras=extras, constraints=versions, | |
263 marker=mark_expr, url=uri, requirement=rs) | |
264 | |
265 | |
266 def get_resources_dests(resources_root, rules): | |
267 """Find destinations for resources files""" | |
268 | |
269 def get_rel_path(root, path): | |
270 # normalizes and returns a lstripped-/-separated path | |
271 root = root.replace(os.path.sep, '/') | |
272 path = path.replace(os.path.sep, '/') | |
273 assert path.startswith(root) | |
274 return path[len(root):].lstrip('/') | |
275 | |
276 destinations = {} | |
277 for base, suffix, dest in rules: | |
278 prefix = os.path.join(resources_root, base) | |
279 for abs_base in iglob(prefix): | |
280 abs_glob = os.path.join(abs_base, suffix) | |
281 for abs_path in iglob(abs_glob): | |
282 resource_file = get_rel_path(resources_root, abs_path) | |
283 if dest is None: # remove the entry if it was here | |
284 destinations.pop(resource_file, None) | |
285 else: | |
286 rel_path = get_rel_path(abs_base, abs_path) | |
287 rel_dest = dest.replace(os.path.sep, '/').rstrip('/') | |
288 destinations[resource_file] = rel_dest + '/' + rel_path | |
289 return destinations | |
290 | |
291 | |
292 def in_venv(): | |
293 if hasattr(sys, 'real_prefix'): | |
294 # virtualenv venvs | |
295 result = True | |
296 else: | |
297 # PEP 405 venvs | |
298 result = sys.prefix != getattr(sys, 'base_prefix', sys.prefix) | |
299 return result | |
300 | |
301 | |
302 def get_executable(): | |
303 # The __PYVENV_LAUNCHER__ dance is apparently no longer needed, as | |
304 # changes to the stub launcher mean that sys.executable always points | |
305 # to the stub on OS X | |
306 # if sys.platform == 'darwin' and ('__PYVENV_LAUNCHER__' | |
307 # in os.environ): | |
308 # result = os.environ['__PYVENV_LAUNCHER__'] | |
309 # else: | |
310 # result = sys.executable | |
311 # return result | |
312 result = os.path.normcase(sys.executable) | |
313 if not isinstance(result, text_type): | |
314 result = fsdecode(result) | |
315 return result | |
316 | |
317 | |
318 def proceed(prompt, allowed_chars, error_prompt=None, default=None): | |
319 p = prompt | |
320 while True: | |
321 s = raw_input(p) | |
322 p = prompt | |
323 if not s and default: | |
324 s = default | |
325 if s: | |
326 c = s[0].lower() | |
327 if c in allowed_chars: | |
328 break | |
329 if error_prompt: | |
330 p = '%c: %s\n%s' % (c, error_prompt, prompt) | |
331 return c | |
332 | |
333 | |
334 def extract_by_key(d, keys): | |
335 if isinstance(keys, string_types): | |
336 keys = keys.split() | |
337 result = {} | |
338 for key in keys: | |
339 if key in d: | |
340 result[key] = d[key] | |
341 return result | |
342 | |
343 def read_exports(stream): | |
344 if sys.version_info[0] >= 3: | |
345 # needs to be a text stream | |
346 stream = codecs.getreader('utf-8')(stream) | |
347 # Try to load as JSON, falling back on legacy format | |
348 data = stream.read() | |
349 stream = StringIO(data) | |
350 try: | |
351 jdata = json.load(stream) | |
352 result = jdata['extensions']['python.exports']['exports'] | |
353 for group, entries in result.items(): | |
354 for k, v in entries.items(): | |
355 s = '%s = %s' % (k, v) | |
356 entry = get_export_entry(s) | |
357 assert entry is not None | |
358 entries[k] = entry | |
359 return result | |
360 except Exception: | |
361 stream.seek(0, 0) | |
362 | |
363 def read_stream(cp, stream): | |
364 if hasattr(cp, 'read_file'): | |
365 cp.read_file(stream) | |
366 else: | |
367 cp.readfp(stream) | |
368 | |
369 cp = configparser.ConfigParser() | |
370 try: | |
371 read_stream(cp, stream) | |
372 except configparser.MissingSectionHeaderError: | |
373 stream.close() | |
374 data = textwrap.dedent(data) | |
375 stream = StringIO(data) | |
376 read_stream(cp, stream) | |
377 | |
378 result = {} | |
379 for key in cp.sections(): | |
380 result[key] = entries = {} | |
381 for name, value in cp.items(key): | |
382 s = '%s = %s' % (name, value) | |
383 entry = get_export_entry(s) | |
384 assert entry is not None | |
385 #entry.dist = self | |
386 entries[name] = entry | |
387 return result | |
388 | |
389 | |
390 def write_exports(exports, stream): | |
391 if sys.version_info[0] >= 3: | |
392 # needs to be a text stream | |
393 stream = codecs.getwriter('utf-8')(stream) | |
394 cp = configparser.ConfigParser() | |
395 for k, v in exports.items(): | |
396 # TODO check k, v for valid values | |
397 cp.add_section(k) | |
398 for entry in v.values(): | |
399 if entry.suffix is None: | |
400 s = entry.prefix | |
401 else: | |
402 s = '%s:%s' % (entry.prefix, entry.suffix) | |
403 if entry.flags: | |
404 s = '%s [%s]' % (s, ', '.join(entry.flags)) | |
405 cp.set(k, entry.name, s) | |
406 cp.write(stream) | |
407 | |
408 | |
409 @contextlib.contextmanager | |
410 def tempdir(): | |
411 td = tempfile.mkdtemp() | |
412 try: | |
413 yield td | |
414 finally: | |
415 shutil.rmtree(td) | |
416 | |
417 @contextlib.contextmanager | |
418 def chdir(d): | |
419 cwd = os.getcwd() | |
420 try: | |
421 os.chdir(d) | |
422 yield | |
423 finally: | |
424 os.chdir(cwd) | |
425 | |
426 | |
427 @contextlib.contextmanager | |
428 def socket_timeout(seconds=15): | |
429 cto = socket.getdefaulttimeout() | |
430 try: | |
431 socket.setdefaulttimeout(seconds) | |
432 yield | |
433 finally: | |
434 socket.setdefaulttimeout(cto) | |
435 | |
436 | |
437 class cached_property(object): | |
438 def __init__(self, func): | |
439 self.func = func | |
440 #for attr in ('__name__', '__module__', '__doc__'): | |
441 # setattr(self, attr, getattr(func, attr, None)) | |
442 | |
443 def __get__(self, obj, cls=None): | |
444 if obj is None: | |
445 return self | |
446 value = self.func(obj) | |
447 object.__setattr__(obj, self.func.__name__, value) | |
448 #obj.__dict__[self.func.__name__] = value = self.func(obj) | |
449 return value | |
450 | |
451 def convert_path(pathname): | |
452 """Return 'pathname' as a name that will work on the native filesystem. | |
453 | |
454 The path is split on '/' and put back together again using the current | |
455 directory separator. Needed because filenames in the setup script are | |
456 always supplied in Unix style, and have to be converted to the local | |
457 convention before we can actually use them in the filesystem. Raises | |
458 ValueError on non-Unix-ish systems if 'pathname' either starts or | |
459 ends with a slash. | |
460 """ | |
461 if os.sep == '/': | |
462 return pathname | |
463 if not pathname: | |
464 return pathname | |
465 if pathname[0] == '/': | |
466 raise ValueError("path '%s' cannot be absolute" % pathname) | |
467 if pathname[-1] == '/': | |
468 raise ValueError("path '%s' cannot end with '/'" % pathname) | |
469 | |
470 paths = pathname.split('/') | |
471 while os.curdir in paths: | |
472 paths.remove(os.curdir) | |
473 if not paths: | |
474 return os.curdir | |
475 return os.path.join(*paths) | |
476 | |
477 | |
478 class FileOperator(object): | |
479 def __init__(self, dry_run=False): | |
480 self.dry_run = dry_run | |
481 self.ensured = set() | |
482 self._init_record() | |
483 | |
484 def _init_record(self): | |
485 self.record = False | |
486 self.files_written = set() | |
487 self.dirs_created = set() | |
488 | |
489 def record_as_written(self, path): | |
490 if self.record: | |
491 self.files_written.add(path) | |
492 | |
493 def newer(self, source, target): | |
494 """Tell if the target is newer than the source. | |
495 | |
496 Returns true if 'source' exists and is more recently modified than | |
497 'target', or if 'source' exists and 'target' doesn't. | |
498 | |
499 Returns false if both exist and 'target' is the same age or younger | |
500 than 'source'. Raise PackagingFileError if 'source' does not exist. | |
501 | |
502 Note that this test is not very accurate: files created in the same | |
503 second will have the same "age". | |
504 """ | |
505 if not os.path.exists(source): | |
506 raise DistlibException("file '%r' does not exist" % | |
507 os.path.abspath(source)) | |
508 if not os.path.exists(target): | |
509 return True | |
510 | |
511 return os.stat(source).st_mtime > os.stat(target).st_mtime | |
512 | |
513 def copy_file(self, infile, outfile, check=True): | |
514 """Copy a file respecting dry-run and force flags. | |
515 """ | |
516 self.ensure_dir(os.path.dirname(outfile)) | |
517 logger.info('Copying %s to %s', infile, outfile) | |
518 if not self.dry_run: | |
519 msg = None | |
520 if check: | |
521 if os.path.islink(outfile): | |
522 msg = '%s is a symlink' % outfile | |
523 elif os.path.exists(outfile) and not os.path.isfile(outfile): | |
524 msg = '%s is a non-regular file' % outfile | |
525 if msg: | |
526 raise ValueError(msg + ' which would be overwritten') | |
527 shutil.copyfile(infile, outfile) | |
528 self.record_as_written(outfile) | |
529 | |
530 def copy_stream(self, instream, outfile, encoding=None): | |
531 assert not os.path.isdir(outfile) | |
532 self.ensure_dir(os.path.dirname(outfile)) | |
533 logger.info('Copying stream %s to %s', instream, outfile) | |
534 if not self.dry_run: | |
535 if encoding is None: | |
536 outstream = open(outfile, 'wb') | |
537 else: | |
538 outstream = codecs.open(outfile, 'w', encoding=encoding) | |
539 try: | |
540 shutil.copyfileobj(instream, outstream) | |
541 finally: | |
542 outstream.close() | |
543 self.record_as_written(outfile) | |
544 | |
545 def write_binary_file(self, path, data): | |
546 self.ensure_dir(os.path.dirname(path)) | |
547 if not self.dry_run: | |
548 if os.path.exists(path): | |
549 os.remove(path) | |
550 with open(path, 'wb') as f: | |
551 f.write(data) | |
552 self.record_as_written(path) | |
553 | |
554 def write_text_file(self, path, data, encoding): | |
555 self.write_binary_file(path, data.encode(encoding)) | |
556 | |
557 def set_mode(self, bits, mask, files): | |
558 if os.name == 'posix' or (os.name == 'java' and os._name == 'posix'): | |
559 # Set the executable bits (owner, group, and world) on | |
560 # all the files specified. | |
561 for f in files: | |
562 if self.dry_run: | |
563 logger.info("changing mode of %s", f) | |
564 else: | |
565 mode = (os.stat(f).st_mode | bits) & mask | |
566 logger.info("changing mode of %s to %o", f, mode) | |
567 os.chmod(f, mode) | |
568 | |
569 set_executable_mode = lambda s, f: s.set_mode(0o555, 0o7777, f) | |
570 | |
571 def ensure_dir(self, path): | |
572 path = os.path.abspath(path) | |
573 if path not in self.ensured and not os.path.exists(path): | |
574 self.ensured.add(path) | |
575 d, f = os.path.split(path) | |
576 self.ensure_dir(d) | |
577 logger.info('Creating %s' % path) | |
578 if not self.dry_run: | |
579 os.mkdir(path) | |
580 if self.record: | |
581 self.dirs_created.add(path) | |
582 | |
583 def byte_compile(self, path, optimize=False, force=False, prefix=None, hashed_invalidation=False): | |
584 dpath = cache_from_source(path, not optimize) | |
585 logger.info('Byte-compiling %s to %s', path, dpath) | |
586 if not self.dry_run: | |
587 if force or self.newer(path, dpath): | |
588 if not prefix: | |
589 diagpath = None | |
590 else: | |
591 assert path.startswith(prefix) | |
592 diagpath = path[len(prefix):] | |
593 compile_kwargs = {} | |
594 if hashed_invalidation and hasattr(py_compile, 'PycInvalidationMode'): | |
595 compile_kwargs['invalidation_mode'] = py_compile.PycInvalidationMode.CHECKED_HASH | |
596 py_compile.compile(path, dpath, diagpath, True, **compile_kwargs) # raise error | |
597 self.record_as_written(dpath) | |
598 return dpath | |
599 | |
600 def ensure_removed(self, path): | |
601 if os.path.exists(path): | |
602 if os.path.isdir(path) and not os.path.islink(path): | |
603 logger.debug('Removing directory tree at %s', path) | |
604 if not self.dry_run: | |
605 shutil.rmtree(path) | |
606 if self.record: | |
607 if path in self.dirs_created: | |
608 self.dirs_created.remove(path) | |
609 else: | |
610 if os.path.islink(path): | |
611 s = 'link' | |
612 else: | |
613 s = 'file' | |
614 logger.debug('Removing %s %s', s, path) | |
615 if not self.dry_run: | |
616 os.remove(path) | |
617 if self.record: | |
618 if path in self.files_written: | |
619 self.files_written.remove(path) | |
620 | |
621 def is_writable(self, path): | |
622 result = False | |
623 while not result: | |
624 if os.path.exists(path): | |
625 result = os.access(path, os.W_OK) | |
626 break | |
627 parent = os.path.dirname(path) | |
628 if parent == path: | |
629 break | |
630 path = parent | |
631 return result | |
632 | |
633 def commit(self): | |
634 """ | |
635 Commit recorded changes, turn off recording, return | |
636 changes. | |
637 """ | |
638 assert self.record | |
639 result = self.files_written, self.dirs_created | |
640 self._init_record() | |
641 return result | |
642 | |
643 def rollback(self): | |
644 if not self.dry_run: | |
645 for f in list(self.files_written): | |
646 if os.path.exists(f): | |
647 os.remove(f) | |
648 # dirs should all be empty now, except perhaps for | |
649 # __pycache__ subdirs | |
650 # reverse so that subdirs appear before their parents | |
651 dirs = sorted(self.dirs_created, reverse=True) | |
652 for d in dirs: | |
653 flist = os.listdir(d) | |
654 if flist: | |
655 assert flist == ['__pycache__'] | |
656 sd = os.path.join(d, flist[0]) | |
657 os.rmdir(sd) | |
658 os.rmdir(d) # should fail if non-empty | |
659 self._init_record() | |
660 | |
661 def resolve(module_name, dotted_path): | |
662 if module_name in sys.modules: | |
663 mod = sys.modules[module_name] | |
664 else: | |
665 mod = __import__(module_name) | |
666 if dotted_path is None: | |
667 result = mod | |
668 else: | |
669 parts = dotted_path.split('.') | |
670 result = getattr(mod, parts.pop(0)) | |
671 for p in parts: | |
672 result = getattr(result, p) | |
673 return result | |
674 | |
675 | |
676 class ExportEntry(object): | |
677 def __init__(self, name, prefix, suffix, flags): | |
678 self.name = name | |
679 self.prefix = prefix | |
680 self.suffix = suffix | |
681 self.flags = flags | |
682 | |
683 @cached_property | |
684 def value(self): | |
685 return resolve(self.prefix, self.suffix) | |
686 | |
687 def __repr__(self): # pragma: no cover | |
688 return '<ExportEntry %s = %s:%s %s>' % (self.name, self.prefix, | |
689 self.suffix, self.flags) | |
690 | |
691 def __eq__(self, other): | |
692 if not isinstance(other, ExportEntry): | |
693 result = False | |
694 else: | |
695 result = (self.name == other.name and | |
696 self.prefix == other.prefix and | |
697 self.suffix == other.suffix and | |
698 self.flags == other.flags) | |
699 return result | |
700 | |
701 __hash__ = object.__hash__ | |
702 | |
703 | |
704 ENTRY_RE = re.compile(r'''(?P<name>(\w|[-.+])+) | |
705 \s*=\s*(?P<callable>(\w+)([:\.]\w+)*) | |
706 \s*(\[\s*(?P<flags>[\w-]+(=\w+)?(,\s*\w+(=\w+)?)*)\s*\])? | |
707 ''', re.VERBOSE) | |
708 | |
709 def get_export_entry(specification): | |
710 m = ENTRY_RE.search(specification) | |
711 if not m: | |
712 result = None | |
713 if '[' in specification or ']' in specification: | |
714 raise DistlibException("Invalid specification " | |
715 "'%s'" % specification) | |
716 else: | |
717 d = m.groupdict() | |
718 name = d['name'] | |
719 path = d['callable'] | |
720 colons = path.count(':') | |
721 if colons == 0: | |
722 prefix, suffix = path, None | |
723 else: | |
724 if colons != 1: | |
725 raise DistlibException("Invalid specification " | |
726 "'%s'" % specification) | |
727 prefix, suffix = path.split(':') | |
728 flags = d['flags'] | |
729 if flags is None: | |
730 if '[' in specification or ']' in specification: | |
731 raise DistlibException("Invalid specification " | |
732 "'%s'" % specification) | |
733 flags = [] | |
734 else: | |
735 flags = [f.strip() for f in flags.split(',')] | |
736 result = ExportEntry(name, prefix, suffix, flags) | |
737 return result | |
738 | |
739 | |
740 def get_cache_base(suffix=None): | |
741 """ | |
742 Return the default base location for distlib caches. If the directory does | |
743 not exist, it is created. Use the suffix provided for the base directory, | |
744 and default to '.distlib' if it isn't provided. | |
745 | |
746 On Windows, if LOCALAPPDATA is defined in the environment, then it is | |
747 assumed to be a directory, and will be the parent directory of the result. | |
748 On POSIX, and on Windows if LOCALAPPDATA is not defined, the user's home | |
749 directory - using os.expanduser('~') - will be the parent directory of | |
750 the result. | |
751 | |
752 The result is just the directory '.distlib' in the parent directory as | |
753 determined above, or with the name specified with ``suffix``. | |
754 """ | |
755 if suffix is None: | |
756 suffix = '.distlib' | |
757 if os.name == 'nt' and 'LOCALAPPDATA' in os.environ: | |
758 result = os.path.expandvars('$localappdata') | |
759 else: | |
760 # Assume posix, or old Windows | |
761 result = os.path.expanduser('~') | |
762 # we use 'isdir' instead of 'exists', because we want to | |
763 # fail if there's a file with that name | |
764 if os.path.isdir(result): | |
765 usable = os.access(result, os.W_OK) | |
766 if not usable: | |
767 logger.warning('Directory exists but is not writable: %s', result) | |
768 else: | |
769 try: | |
770 os.makedirs(result) | |
771 usable = True | |
772 except OSError: | |
773 logger.warning('Unable to create %s', result, exc_info=True) | |
774 usable = False | |
775 if not usable: | |
776 result = tempfile.mkdtemp() | |
777 logger.warning('Default location unusable, using %s', result) | |
778 return os.path.join(result, suffix) | |
779 | |
780 | |
781 def path_to_cache_dir(path): | |
782 """ | |
783 Convert an absolute path to a directory name for use in a cache. | |
784 | |
785 The algorithm used is: | |
786 | |
787 #. On Windows, any ``':'`` in the drive is replaced with ``'---'``. | |
788 #. Any occurrence of ``os.sep`` is replaced with ``'--'``. | |
789 #. ``'.cache'`` is appended. | |
790 """ | |
791 d, p = os.path.splitdrive(os.path.abspath(path)) | |
792 if d: | |
793 d = d.replace(':', '---') | |
794 p = p.replace(os.sep, '--') | |
795 return d + p + '.cache' | |
796 | |
797 | |
798 def ensure_slash(s): | |
799 if not s.endswith('/'): | |
800 return s + '/' | |
801 return s | |
802 | |
803 | |
804 def parse_credentials(netloc): | |
805 username = password = None | |
806 if '@' in netloc: | |
807 prefix, netloc = netloc.rsplit('@', 1) | |
808 if ':' not in prefix: | |
809 username = prefix | |
810 else: | |
811 username, password = prefix.split(':', 1) | |
812 if username: | |
813 username = unquote(username) | |
814 if password: | |
815 password = unquote(password) | |
816 return username, password, netloc | |
817 | |
818 | |
819 def get_process_umask(): | |
820 result = os.umask(0o22) | |
821 os.umask(result) | |
822 return result | |
823 | |
824 def is_string_sequence(seq): | |
825 result = True | |
826 i = None | |
827 for i, s in enumerate(seq): | |
828 if not isinstance(s, string_types): | |
829 result = False | |
830 break | |
831 assert i is not None | |
832 return result | |
833 | |
834 PROJECT_NAME_AND_VERSION = re.compile('([a-z0-9_]+([.-][a-z_][a-z0-9_]*)*)-' | |
835 '([a-z0-9_.+-]+)', re.I) | |
836 PYTHON_VERSION = re.compile(r'-py(\d\.?\d?)') | |
837 | |
838 | |
839 def split_filename(filename, project_name=None): | |
840 """ | |
841 Extract name, version, python version from a filename (no extension) | |
842 | |
843 Return name, version, pyver or None | |
844 """ | |
845 result = None | |
846 pyver = None | |
847 filename = unquote(filename).replace(' ', '-') | |
848 m = PYTHON_VERSION.search(filename) | |
849 if m: | |
850 pyver = m.group(1) | |
851 filename = filename[:m.start()] | |
852 if project_name and len(filename) > len(project_name) + 1: | |
853 m = re.match(re.escape(project_name) + r'\b', filename) | |
854 if m: | |
855 n = m.end() | |
856 result = filename[:n], filename[n + 1:], pyver | |
857 if result is None: | |
858 m = PROJECT_NAME_AND_VERSION.match(filename) | |
859 if m: | |
860 result = m.group(1), m.group(3), pyver | |
861 return result | |
862 | |
863 # Allow spaces in name because of legacy dists like "Twisted Core" | |
864 NAME_VERSION_RE = re.compile(r'(?P<name>[\w .-]+)\s*' | |
865 r'\(\s*(?P<ver>[^\s)]+)\)$') | |
866 | |
867 def parse_name_and_version(p): | |
868 """ | |
869 A utility method used to get name and version from a string. | |
870 | |
871 From e.g. a Provides-Dist value. | |
872 | |
873 :param p: A value in a form 'foo (1.0)' | |
874 :return: The name and version as a tuple. | |
875 """ | |
876 m = NAME_VERSION_RE.match(p) | |
877 if not m: | |
878 raise DistlibException('Ill-formed name/version string: \'%s\'' % p) | |
879 d = m.groupdict() | |
880 return d['name'].strip().lower(), d['ver'] | |
881 | |
882 def get_extras(requested, available): | |
883 result = set() | |
884 requested = set(requested or []) | |
885 available = set(available or []) | |
886 if '*' in requested: | |
887 requested.remove('*') | |
888 result |= available | |
889 for r in requested: | |
890 if r == '-': | |
891 result.add(r) | |
892 elif r.startswith('-'): | |
893 unwanted = r[1:] | |
894 if unwanted not in available: | |
895 logger.warning('undeclared extra: %s' % unwanted) | |
896 if unwanted in result: | |
897 result.remove(unwanted) | |
898 else: | |
899 if r not in available: | |
900 logger.warning('undeclared extra: %s' % r) | |
901 result.add(r) | |
902 return result | |
903 # | |
904 # Extended metadata functionality | |
905 # | |
906 | |
907 def _get_external_data(url): | |
908 result = {} | |
909 try: | |
910 # urlopen might fail if it runs into redirections, | |
911 # because of Python issue #13696. Fixed in locators | |
912 # using a custom redirect handler. | |
913 resp = urlopen(url) | |
914 headers = resp.info() | |
915 ct = headers.get('Content-Type') | |
916 if not ct.startswith('application/json'): | |
917 logger.debug('Unexpected response for JSON request: %s', ct) | |
918 else: | |
919 reader = codecs.getreader('utf-8')(resp) | |
920 #data = reader.read().decode('utf-8') | |
921 #result = json.loads(data) | |
922 result = json.load(reader) | |
923 except Exception as e: | |
924 logger.exception('Failed to get external data for %s: %s', url, e) | |
925 return result | |
926 | |
927 _external_data_base_url = 'https://www.red-dove.com/pypi/projects/' | |
928 | |
929 def get_project_data(name): | |
930 url = '%s/%s/project.json' % (name[0].upper(), name) | |
931 url = urljoin(_external_data_base_url, url) | |
932 result = _get_external_data(url) | |
933 return result | |
934 | |
935 def get_package_data(name, version): | |
936 url = '%s/%s/package-%s.json' % (name[0].upper(), name, version) | |
937 url = urljoin(_external_data_base_url, url) | |
938 return _get_external_data(url) | |
939 | |
940 | |
941 class Cache(object): | |
942 """ | |
943 A class implementing a cache for resources that need to live in the file system | |
944 e.g. shared libraries. This class was moved from resources to here because it | |
945 could be used by other modules, e.g. the wheel module. | |
946 """ | |
947 | |
948 def __init__(self, base): | |
949 """ | |
950 Initialise an instance. | |
951 | |
952 :param base: The base directory where the cache should be located. | |
953 """ | |
954 # we use 'isdir' instead of 'exists', because we want to | |
955 # fail if there's a file with that name | |
956 if not os.path.isdir(base): # pragma: no cover | |
957 os.makedirs(base) | |
958 if (os.stat(base).st_mode & 0o77) != 0: | |
959 logger.warning('Directory \'%s\' is not private', base) | |
960 self.base = os.path.abspath(os.path.normpath(base)) | |
961 | |
962 def prefix_to_dir(self, prefix): | |
963 """ | |
964 Converts a resource prefix to a directory name in the cache. | |
965 """ | |
966 return path_to_cache_dir(prefix) | |
967 | |
968 def clear(self): | |
969 """ | |
970 Clear the cache. | |
971 """ | |
972 not_removed = [] | |
973 for fn in os.listdir(self.base): | |
974 fn = os.path.join(self.base, fn) | |
975 try: | |
976 if os.path.islink(fn) or os.path.isfile(fn): | |
977 os.remove(fn) | |
978 elif os.path.isdir(fn): | |
979 shutil.rmtree(fn) | |
980 except Exception: | |
981 not_removed.append(fn) | |
982 return not_removed | |
983 | |
984 | |
985 class EventMixin(object): | |
986 """ | |
987 A very simple publish/subscribe system. | |
988 """ | |
989 def __init__(self): | |
990 self._subscribers = {} | |
991 | |
992 def add(self, event, subscriber, append=True): | |
993 """ | |
994 Add a subscriber for an event. | |
995 | |
996 :param event: The name of an event. | |
997 :param subscriber: The subscriber to be added (and called when the | |
998 event is published). | |
999 :param append: Whether to append or prepend the subscriber to an | |
1000 existing subscriber list for the event. | |
1001 """ | |
1002 subs = self._subscribers | |
1003 if event not in subs: | |
1004 subs[event] = deque([subscriber]) | |
1005 else: | |
1006 sq = subs[event] | |
1007 if append: | |
1008 sq.append(subscriber) | |
1009 else: | |
1010 sq.appendleft(subscriber) | |
1011 | |
1012 def remove(self, event, subscriber): | |
1013 """ | |
1014 Remove a subscriber for an event. | |
1015 | |
1016 :param event: The name of an event. | |
1017 :param subscriber: The subscriber to be removed. | |
1018 """ | |
1019 subs = self._subscribers | |
1020 if event not in subs: | |
1021 raise ValueError('No subscribers: %r' % event) | |
1022 subs[event].remove(subscriber) | |
1023 | |
1024 def get_subscribers(self, event): | |
1025 """ | |
1026 Return an iterator for the subscribers for an event. | |
1027 :param event: The event to return subscribers for. | |
1028 """ | |
1029 return iter(self._subscribers.get(event, ())) | |
1030 | |
1031 def publish(self, event, *args, **kwargs): | |
1032 """ | |
1033 Publish a event and return a list of values returned by its | |
1034 subscribers. | |
1035 | |
1036 :param event: The event to publish. | |
1037 :param args: The positional arguments to pass to the event's | |
1038 subscribers. | |
1039 :param kwargs: The keyword arguments to pass to the event's | |
1040 subscribers. | |
1041 """ | |
1042 result = [] | |
1043 for subscriber in self.get_subscribers(event): | |
1044 try: | |
1045 value = subscriber(event, *args, **kwargs) | |
1046 except Exception: | |
1047 logger.exception('Exception during event publication') | |
1048 value = None | |
1049 result.append(value) | |
1050 logger.debug('publish %s: args = %s, kwargs = %s, result = %s', | |
1051 event, args, kwargs, result) | |
1052 return result | |
1053 | |
1054 # | |
1055 # Simple sequencing | |
1056 # | |
1057 class Sequencer(object): | |
1058 def __init__(self): | |
1059 self._preds = {} | |
1060 self._succs = {} | |
1061 self._nodes = set() # nodes with no preds/succs | |
1062 | |
1063 def add_node(self, node): | |
1064 self._nodes.add(node) | |
1065 | |
1066 def remove_node(self, node, edges=False): | |
1067 if node in self._nodes: | |
1068 self._nodes.remove(node) | |
1069 if edges: | |
1070 for p in set(self._preds.get(node, ())): | |
1071 self.remove(p, node) | |
1072 for s in set(self._succs.get(node, ())): | |
1073 self.remove(node, s) | |
1074 # Remove empties | |
1075 for k, v in list(self._preds.items()): | |
1076 if not v: | |
1077 del self._preds[k] | |
1078 for k, v in list(self._succs.items()): | |
1079 if not v: | |
1080 del self._succs[k] | |
1081 | |
1082 def add(self, pred, succ): | |
1083 assert pred != succ | |
1084 self._preds.setdefault(succ, set()).add(pred) | |
1085 self._succs.setdefault(pred, set()).add(succ) | |
1086 | |
1087 def remove(self, pred, succ): | |
1088 assert pred != succ | |
1089 try: | |
1090 preds = self._preds[succ] | |
1091 succs = self._succs[pred] | |
1092 except KeyError: # pragma: no cover | |
1093 raise ValueError('%r not a successor of anything' % succ) | |
1094 try: | |
1095 preds.remove(pred) | |
1096 succs.remove(succ) | |
1097 except KeyError: # pragma: no cover | |
1098 raise ValueError('%r not a successor of %r' % (succ, pred)) | |
1099 | |
1100 def is_step(self, step): | |
1101 return (step in self._preds or step in self._succs or | |
1102 step in self._nodes) | |
1103 | |
1104 def get_steps(self, final): | |
1105 if not self.is_step(final): | |
1106 raise ValueError('Unknown: %r' % final) | |
1107 result = [] | |
1108 todo = [] | |
1109 seen = set() | |
1110 todo.append(final) | |
1111 while todo: | |
1112 step = todo.pop(0) | |
1113 if step in seen: | |
1114 # if a step was already seen, | |
1115 # move it to the end (so it will appear earlier | |
1116 # when reversed on return) ... but not for the | |
1117 # final step, as that would be confusing for | |
1118 # users | |
1119 if step != final: | |
1120 result.remove(step) | |
1121 result.append(step) | |
1122 else: | |
1123 seen.add(step) | |
1124 result.append(step) | |
1125 preds = self._preds.get(step, ()) | |
1126 todo.extend(preds) | |
1127 return reversed(result) | |
1128 | |
1129 @property | |
1130 def strong_connections(self): | |
1131 #http://en.wikipedia.org/wiki/Tarjan%27s_strongly_connected_components_algorithm | |
1132 index_counter = [0] | |
1133 stack = [] | |
1134 lowlinks = {} | |
1135 index = {} | |
1136 result = [] | |
1137 | |
1138 graph = self._succs | |
1139 | |
1140 def strongconnect(node): | |
1141 # set the depth index for this node to the smallest unused index | |
1142 index[node] = index_counter[0] | |
1143 lowlinks[node] = index_counter[0] | |
1144 index_counter[0] += 1 | |
1145 stack.append(node) | |
1146 | |
1147 # Consider successors | |
1148 try: | |
1149 successors = graph[node] | |
1150 except Exception: | |
1151 successors = [] | |
1152 for successor in successors: | |
1153 if successor not in lowlinks: | |
1154 # Successor has not yet been visited | |
1155 strongconnect(successor) | |
1156 lowlinks[node] = min(lowlinks[node],lowlinks[successor]) | |
1157 elif successor in stack: | |
1158 # the successor is in the stack and hence in the current | |
1159 # strongly connected component (SCC) | |
1160 lowlinks[node] = min(lowlinks[node],index[successor]) | |
1161 | |
1162 # If `node` is a root node, pop the stack and generate an SCC | |
1163 if lowlinks[node] == index[node]: | |
1164 connected_component = [] | |
1165 | |
1166 while True: | |
1167 successor = stack.pop() | |
1168 connected_component.append(successor) | |
1169 if successor == node: break | |
1170 component = tuple(connected_component) | |
1171 # storing the result | |
1172 result.append(component) | |
1173 | |
1174 for node in graph: | |
1175 if node not in lowlinks: | |
1176 strongconnect(node) | |
1177 | |
1178 return result | |
1179 | |
1180 @property | |
1181 def dot(self): | |
1182 result = ['digraph G {'] | |
1183 for succ in self._preds: | |
1184 preds = self._preds[succ] | |
1185 for pred in preds: | |
1186 result.append(' %s -> %s;' % (pred, succ)) | |
1187 for node in self._nodes: | |
1188 result.append(' %s;' % node) | |
1189 result.append('}') | |
1190 return '\n'.join(result) | |
1191 | |
1192 # | |
1193 # Unarchiving functionality for zip, tar, tgz, tbz, whl | |
1194 # | |
1195 | |
1196 ARCHIVE_EXTENSIONS = ('.tar.gz', '.tar.bz2', '.tar', '.zip', | |
1197 '.tgz', '.tbz', '.whl') | |
1198 | |
1199 def unarchive(archive_filename, dest_dir, format=None, check=True): | |
1200 | |
1201 def check_path(path): | |
1202 if not isinstance(path, text_type): | |
1203 path = path.decode('utf-8') | |
1204 p = os.path.abspath(os.path.join(dest_dir, path)) | |
1205 if not p.startswith(dest_dir) or p[plen] != os.sep: | |
1206 raise ValueError('path outside destination: %r' % p) | |
1207 | |
1208 dest_dir = os.path.abspath(dest_dir) | |
1209 plen = len(dest_dir) | |
1210 archive = None | |
1211 if format is None: | |
1212 if archive_filename.endswith(('.zip', '.whl')): | |
1213 format = 'zip' | |
1214 elif archive_filename.endswith(('.tar.gz', '.tgz')): | |
1215 format = 'tgz' | |
1216 mode = 'r:gz' | |
1217 elif archive_filename.endswith(('.tar.bz2', '.tbz')): | |
1218 format = 'tbz' | |
1219 mode = 'r:bz2' | |
1220 elif archive_filename.endswith('.tar'): | |
1221 format = 'tar' | |
1222 mode = 'r' | |
1223 else: # pragma: no cover | |
1224 raise ValueError('Unknown format for %r' % archive_filename) | |
1225 try: | |
1226 if format == 'zip': | |
1227 archive = ZipFile(archive_filename, 'r') | |
1228 if check: | |
1229 names = archive.namelist() | |
1230 for name in names: | |
1231 check_path(name) | |
1232 else: | |
1233 archive = tarfile.open(archive_filename, mode) | |
1234 if check: | |
1235 names = archive.getnames() | |
1236 for name in names: | |
1237 check_path(name) | |
1238 if format != 'zip' and sys.version_info[0] < 3: | |
1239 # See Python issue 17153. If the dest path contains Unicode, | |
1240 # tarfile extraction fails on Python 2.x if a member path name | |
1241 # contains non-ASCII characters - it leads to an implicit | |
1242 # bytes -> unicode conversion using ASCII to decode. | |
1243 for tarinfo in archive.getmembers(): | |
1244 if not isinstance(tarinfo.name, text_type): | |
1245 tarinfo.name = tarinfo.name.decode('utf-8') | |
1246 archive.extractall(dest_dir) | |
1247 | |
1248 finally: | |
1249 if archive: | |
1250 archive.close() | |
1251 | |
1252 | |
1253 def zip_dir(directory): | |
1254 """zip a directory tree into a BytesIO object""" | |
1255 result = io.BytesIO() | |
1256 dlen = len(directory) | |
1257 with ZipFile(result, "w") as zf: | |
1258 for root, dirs, files in os.walk(directory): | |
1259 for name in files: | |
1260 full = os.path.join(root, name) | |
1261 rel = root[dlen:] | |
1262 dest = os.path.join(rel, name) | |
1263 zf.write(full, dest) | |
1264 return result | |
1265 | |
1266 # | |
1267 # Simple progress bar | |
1268 # | |
1269 | |
1270 UNITS = ('', 'K', 'M', 'G','T','P') | |
1271 | |
1272 | |
1273 class Progress(object): | |
1274 unknown = 'UNKNOWN' | |
1275 | |
1276 def __init__(self, minval=0, maxval=100): | |
1277 assert maxval is None or maxval >= minval | |
1278 self.min = self.cur = minval | |
1279 self.max = maxval | |
1280 self.started = None | |
1281 self.elapsed = 0 | |
1282 self.done = False | |
1283 | |
1284 def update(self, curval): | |
1285 assert self.min <= curval | |
1286 assert self.max is None or curval <= self.max | |
1287 self.cur = curval | |
1288 now = time.time() | |
1289 if self.started is None: | |
1290 self.started = now | |
1291 else: | |
1292 self.elapsed = now - self.started | |
1293 | |
1294 def increment(self, incr): | |
1295 assert incr >= 0 | |
1296 self.update(self.cur + incr) | |
1297 | |
1298 def start(self): | |
1299 self.update(self.min) | |
1300 return self | |
1301 | |
1302 def stop(self): | |
1303 if self.max is not None: | |
1304 self.update(self.max) | |
1305 self.done = True | |
1306 | |
1307 @property | |
1308 def maximum(self): | |
1309 return self.unknown if self.max is None else self.max | |
1310 | |
1311 @property | |
1312 def percentage(self): | |
1313 if self.done: | |
1314 result = '100 %' | |
1315 elif self.max is None: | |
1316 result = ' ?? %' | |
1317 else: | |
1318 v = 100.0 * (self.cur - self.min) / (self.max - self.min) | |
1319 result = '%3d %%' % v | |
1320 return result | |
1321 | |
1322 def format_duration(self, duration): | |
1323 if (duration <= 0) and self.max is None or self.cur == self.min: | |
1324 result = '??:??:??' | |
1325 #elif duration < 1: | |
1326 # result = '--:--:--' | |
1327 else: | |
1328 result = time.strftime('%H:%M:%S', time.gmtime(duration)) | |
1329 return result | |
1330 | |
1331 @property | |
1332 def ETA(self): | |
1333 if self.done: | |
1334 prefix = 'Done' | |
1335 t = self.elapsed | |
1336 #import pdb; pdb.set_trace() | |
1337 else: | |
1338 prefix = 'ETA ' | |
1339 if self.max is None: | |
1340 t = -1 | |
1341 elif self.elapsed == 0 or (self.cur == self.min): | |
1342 t = 0 | |
1343 else: | |
1344 #import pdb; pdb.set_trace() | |
1345 t = float(self.max - self.min) | |
1346 t /= self.cur - self.min | |
1347 t = (t - 1) * self.elapsed | |
1348 return '%s: %s' % (prefix, self.format_duration(t)) | |
1349 | |
1350 @property | |
1351 def speed(self): | |
1352 if self.elapsed == 0: | |
1353 result = 0.0 | |
1354 else: | |
1355 result = (self.cur - self.min) / self.elapsed | |
1356 for unit in UNITS: | |
1357 if result < 1000: | |
1358 break | |
1359 result /= 1000.0 | |
1360 return '%d %sB/s' % (result, unit) | |
1361 | |
1362 # | |
1363 # Glob functionality | |
1364 # | |
1365 | |
1366 RICH_GLOB = re.compile(r'\{([^}]*)\}') | |
1367 _CHECK_RECURSIVE_GLOB = re.compile(r'[^/\\,{]\*\*|\*\*[^/\\,}]') | |
1368 _CHECK_MISMATCH_SET = re.compile(r'^[^{]*\}|\{[^}]*$') | |
1369 | |
1370 | |
1371 def iglob(path_glob): | |
1372 """Extended globbing function that supports ** and {opt1,opt2,opt3}.""" | |
1373 if _CHECK_RECURSIVE_GLOB.search(path_glob): | |
1374 msg = """invalid glob %r: recursive glob "**" must be used alone""" | |
1375 raise ValueError(msg % path_glob) | |
1376 if _CHECK_MISMATCH_SET.search(path_glob): | |
1377 msg = """invalid glob %r: mismatching set marker '{' or '}'""" | |
1378 raise ValueError(msg % path_glob) | |
1379 return _iglob(path_glob) | |
1380 | |
1381 | |
1382 def _iglob(path_glob): | |
1383 rich_path_glob = RICH_GLOB.split(path_glob, 1) | |
1384 if len(rich_path_glob) > 1: | |
1385 assert len(rich_path_glob) == 3, rich_path_glob | |
1386 prefix, set, suffix = rich_path_glob | |
1387 for item in set.split(','): | |
1388 for path in _iglob(''.join((prefix, item, suffix))): | |
1389 yield path | |
1390 else: | |
1391 if '**' not in path_glob: | |
1392 for item in std_iglob(path_glob): | |
1393 yield item | |
1394 else: | |
1395 prefix, radical = path_glob.split('**', 1) | |
1396 if prefix == '': | |
1397 prefix = '.' | |
1398 if radical == '': | |
1399 radical = '*' | |
1400 else: | |
1401 # we support both | |
1402 radical = radical.lstrip('/') | |
1403 radical = radical.lstrip('\\') | |
1404 for path, dir, files in os.walk(prefix): | |
1405 path = os.path.normpath(path) | |
1406 for fn in _iglob(os.path.join(path, radical)): | |
1407 yield fn | |
1408 | |
1409 if ssl: | |
1410 from .compat import (HTTPSHandler as BaseHTTPSHandler, match_hostname, | |
1411 CertificateError) | |
1412 | |
1413 | |
1414 # | |
1415 # HTTPSConnection which verifies certificates/matches domains | |
1416 # | |
1417 | |
1418 class HTTPSConnection(httplib.HTTPSConnection): | |
1419 ca_certs = None # set this to the path to the certs file (.pem) | |
1420 check_domain = True # only used if ca_certs is not None | |
1421 | |
1422 # noinspection PyPropertyAccess | |
1423 def connect(self): | |
1424 sock = socket.create_connection((self.host, self.port), self.timeout) | |
1425 if getattr(self, '_tunnel_host', False): | |
1426 self.sock = sock | |
1427 self._tunnel() | |
1428 | |
1429 if not hasattr(ssl, 'SSLContext'): | |
1430 # For 2.x | |
1431 if self.ca_certs: | |
1432 cert_reqs = ssl.CERT_REQUIRED | |
1433 else: | |
1434 cert_reqs = ssl.CERT_NONE | |
1435 self.sock = ssl.wrap_socket(sock, self.key_file, self.cert_file, | |
1436 cert_reqs=cert_reqs, | |
1437 ssl_version=ssl.PROTOCOL_SSLv23, | |
1438 ca_certs=self.ca_certs) | |
1439 else: # pragma: no cover | |
1440 context = ssl.SSLContext(ssl.PROTOCOL_SSLv23) | |
1441 if hasattr(ssl, 'OP_NO_SSLv2'): | |
1442 context.options |= ssl.OP_NO_SSLv2 | |
1443 if self.cert_file: | |
1444 context.load_cert_chain(self.cert_file, self.key_file) | |
1445 kwargs = {} | |
1446 if self.ca_certs: | |
1447 context.verify_mode = ssl.CERT_REQUIRED | |
1448 context.load_verify_locations(cafile=self.ca_certs) | |
1449 if getattr(ssl, 'HAS_SNI', False): | |
1450 kwargs['server_hostname'] = self.host | |
1451 self.sock = context.wrap_socket(sock, **kwargs) | |
1452 if self.ca_certs and self.check_domain: | |
1453 try: | |
1454 match_hostname(self.sock.getpeercert(), self.host) | |
1455 logger.debug('Host verified: %s', self.host) | |
1456 except CertificateError: # pragma: no cover | |
1457 self.sock.shutdown(socket.SHUT_RDWR) | |
1458 self.sock.close() | |
1459 raise | |
1460 | |
1461 class HTTPSHandler(BaseHTTPSHandler): | |
1462 def __init__(self, ca_certs, check_domain=True): | |
1463 BaseHTTPSHandler.__init__(self) | |
1464 self.ca_certs = ca_certs | |
1465 self.check_domain = check_domain | |
1466 | |
1467 def _conn_maker(self, *args, **kwargs): | |
1468 """ | |
1469 This is called to create a connection instance. Normally you'd | |
1470 pass a connection class to do_open, but it doesn't actually check for | |
1471 a class, and just expects a callable. As long as we behave just as a | |
1472 constructor would have, we should be OK. If it ever changes so that | |
1473 we *must* pass a class, we'll create an UnsafeHTTPSConnection class | |
1474 which just sets check_domain to False in the class definition, and | |
1475 choose which one to pass to do_open. | |
1476 """ | |
1477 result = HTTPSConnection(*args, **kwargs) | |
1478 if self.ca_certs: | |
1479 result.ca_certs = self.ca_certs | |
1480 result.check_domain = self.check_domain | |
1481 return result | |
1482 | |
1483 def https_open(self, req): | |
1484 try: | |
1485 return self.do_open(self._conn_maker, req) | |
1486 except URLError as e: | |
1487 if 'certificate verify failed' in str(e.reason): | |
1488 raise CertificateError('Unable to verify server certificate ' | |
1489 'for %s' % req.host) | |
1490 else: | |
1491 raise | |
1492 | |
1493 # | |
1494 # To prevent against mixing HTTP traffic with HTTPS (examples: A Man-In-The- | |
1495 # Middle proxy using HTTP listens on port 443, or an index mistakenly serves | |
1496 # HTML containing a http://xyz link when it should be https://xyz), | |
1497 # you can use the following handler class, which does not allow HTTP traffic. | |
1498 # | |
1499 # It works by inheriting from HTTPHandler - so build_opener won't add a | |
1500 # handler for HTTP itself. | |
1501 # | |
1502 class HTTPSOnlyHandler(HTTPSHandler, HTTPHandler): | |
1503 def http_open(self, req): | |
1504 raise URLError('Unexpected HTTP request on what should be a secure ' | |
1505 'connection: %s' % req) | |
1506 | |
1507 # | |
1508 # XML-RPC with timeouts | |
1509 # | |
1510 | |
1511 _ver_info = sys.version_info[:2] | |
1512 | |
1513 if _ver_info == (2, 6): | |
1514 class HTTP(httplib.HTTP): | |
1515 def __init__(self, host='', port=None, **kwargs): | |
1516 if port == 0: # 0 means use port 0, not the default port | |
1517 port = None | |
1518 self._setup(self._connection_class(host, port, **kwargs)) | |
1519 | |
1520 | |
1521 if ssl: | |
1522 class HTTPS(httplib.HTTPS): | |
1523 def __init__(self, host='', port=None, **kwargs): | |
1524 if port == 0: # 0 means use port 0, not the default port | |
1525 port = None | |
1526 self._setup(self._connection_class(host, port, **kwargs)) | |
1527 | |
1528 | |
1529 class Transport(xmlrpclib.Transport): | |
1530 def __init__(self, timeout, use_datetime=0): | |
1531 self.timeout = timeout | |
1532 xmlrpclib.Transport.__init__(self, use_datetime) | |
1533 | |
1534 def make_connection(self, host): | |
1535 h, eh, x509 = self.get_host_info(host) | |
1536 if _ver_info == (2, 6): | |
1537 result = HTTP(h, timeout=self.timeout) | |
1538 else: | |
1539 if not self._connection or host != self._connection[0]: | |
1540 self._extra_headers = eh | |
1541 self._connection = host, httplib.HTTPConnection(h) | |
1542 result = self._connection[1] | |
1543 return result | |
1544 | |
1545 if ssl: | |
1546 class SafeTransport(xmlrpclib.SafeTransport): | |
1547 def __init__(self, timeout, use_datetime=0): | |
1548 self.timeout = timeout | |
1549 xmlrpclib.SafeTransport.__init__(self, use_datetime) | |
1550 | |
1551 def make_connection(self, host): | |
1552 h, eh, kwargs = self.get_host_info(host) | |
1553 if not kwargs: | |
1554 kwargs = {} | |
1555 kwargs['timeout'] = self.timeout | |
1556 if _ver_info == (2, 6): | |
1557 result = HTTPS(host, None, **kwargs) | |
1558 else: | |
1559 if not self._connection or host != self._connection[0]: | |
1560 self._extra_headers = eh | |
1561 self._connection = host, httplib.HTTPSConnection(h, None, | |
1562 **kwargs) | |
1563 result = self._connection[1] | |
1564 return result | |
1565 | |
1566 | |
1567 class ServerProxy(xmlrpclib.ServerProxy): | |
1568 def __init__(self, uri, **kwargs): | |
1569 self.timeout = timeout = kwargs.pop('timeout', None) | |
1570 # The above classes only come into play if a timeout | |
1571 # is specified | |
1572 if timeout is not None: | |
1573 scheme, _ = splittype(uri) | |
1574 use_datetime = kwargs.get('use_datetime', 0) | |
1575 if scheme == 'https': | |
1576 tcls = SafeTransport | |
1577 else: | |
1578 tcls = Transport | |
1579 kwargs['transport'] = t = tcls(timeout, use_datetime=use_datetime) | |
1580 self.transport = t | |
1581 xmlrpclib.ServerProxy.__init__(self, uri, **kwargs) | |
1582 | |
1583 # | |
1584 # CSV functionality. This is provided because on 2.x, the csv module can't | |
1585 # handle Unicode. However, we need to deal with Unicode in e.g. RECORD files. | |
1586 # | |
1587 | |
1588 def _csv_open(fn, mode, **kwargs): | |
1589 if sys.version_info[0] < 3: | |
1590 mode += 'b' | |
1591 else: | |
1592 kwargs['newline'] = '' | |
1593 # Python 3 determines encoding from locale. Force 'utf-8' | |
1594 # file encoding to match other forced utf-8 encoding | |
1595 kwargs['encoding'] = 'utf-8' | |
1596 return open(fn, mode, **kwargs) | |
1597 | |
1598 | |
1599 class CSVBase(object): | |
1600 defaults = { | |
1601 'delimiter': str(','), # The strs are used because we need native | |
1602 'quotechar': str('"'), # str in the csv API (2.x won't take | |
1603 'lineterminator': str('\n') # Unicode) | |
1604 } | |
1605 | |
1606 def __enter__(self): | |
1607 return self | |
1608 | |
1609 def __exit__(self, *exc_info): | |
1610 self.stream.close() | |
1611 | |
1612 | |
1613 class CSVReader(CSVBase): | |
1614 def __init__(self, **kwargs): | |
1615 if 'stream' in kwargs: | |
1616 stream = kwargs['stream'] | |
1617 if sys.version_info[0] >= 3: | |
1618 # needs to be a text stream | |
1619 stream = codecs.getreader('utf-8')(stream) | |
1620 self.stream = stream | |
1621 else: | |
1622 self.stream = _csv_open(kwargs['path'], 'r') | |
1623 self.reader = csv.reader(self.stream, **self.defaults) | |
1624 | |
1625 def __iter__(self): | |
1626 return self | |
1627 | |
1628 def next(self): | |
1629 result = next(self.reader) | |
1630 if sys.version_info[0] < 3: | |
1631 for i, item in enumerate(result): | |
1632 if not isinstance(item, text_type): | |
1633 result[i] = item.decode('utf-8') | |
1634 return result | |
1635 | |
1636 __next__ = next | |
1637 | |
1638 class CSVWriter(CSVBase): | |
1639 def __init__(self, fn, **kwargs): | |
1640 self.stream = _csv_open(fn, 'w') | |
1641 self.writer = csv.writer(self.stream, **self.defaults) | |
1642 | |
1643 def writerow(self, row): | |
1644 if sys.version_info[0] < 3: | |
1645 r = [] | |
1646 for item in row: | |
1647 if isinstance(item, text_type): | |
1648 item = item.encode('utf-8') | |
1649 r.append(item) | |
1650 row = r | |
1651 self.writer.writerow(row) | |
1652 | |
1653 # | |
1654 # Configurator functionality | |
1655 # | |
1656 | |
1657 class Configurator(BaseConfigurator): | |
1658 | |
1659 value_converters = dict(BaseConfigurator.value_converters) | |
1660 value_converters['inc'] = 'inc_convert' | |
1661 | |
1662 def __init__(self, config, base=None): | |
1663 super(Configurator, self).__init__(config) | |
1664 self.base = base or os.getcwd() | |
1665 | |
1666 def configure_custom(self, config): | |
1667 def convert(o): | |
1668 if isinstance(o, (list, tuple)): | |
1669 result = type(o)([convert(i) for i in o]) | |
1670 elif isinstance(o, dict): | |
1671 if '()' in o: | |
1672 result = self.configure_custom(o) | |
1673 else: | |
1674 result = {} | |
1675 for k in o: | |
1676 result[k] = convert(o[k]) | |
1677 else: | |
1678 result = self.convert(o) | |
1679 return result | |
1680 | |
1681 c = config.pop('()') | |
1682 if not callable(c): | |
1683 c = self.resolve(c) | |
1684 props = config.pop('.', None) | |
1685 # Check for valid identifiers | |
1686 args = config.pop('[]', ()) | |
1687 if args: | |
1688 args = tuple([convert(o) for o in args]) | |
1689 items = [(k, convert(config[k])) for k in config if valid_ident(k)] | |
1690 kwargs = dict(items) | |
1691 result = c(*args, **kwargs) | |
1692 if props: | |
1693 for n, v in props.items(): | |
1694 setattr(result, n, convert(v)) | |
1695 return result | |
1696 | |
1697 def __getitem__(self, key): | |
1698 result = self.config[key] | |
1699 if isinstance(result, dict) and '()' in result: | |
1700 self.config[key] = result = self.configure_custom(result) | |
1701 return result | |
1702 | |
1703 def inc_convert(self, value): | |
1704 """Default converter for the inc:// protocol.""" | |
1705 if not os.path.isabs(value): | |
1706 value = os.path.join(self.base, value) | |
1707 with codecs.open(value, 'r', encoding='utf-8') as f: | |
1708 result = json.load(f) | |
1709 return result | |
1710 | |
1711 | |
1712 class SubprocessMixin(object): | |
1713 """ | |
1714 Mixin for running subprocesses and capturing their output | |
1715 """ | |
1716 def __init__(self, verbose=False, progress=None): | |
1717 self.verbose = verbose | |
1718 self.progress = progress | |
1719 | |
1720 def reader(self, stream, context): | |
1721 """ | |
1722 Read lines from a subprocess' output stream and either pass to a progress | |
1723 callable (if specified) or write progress information to sys.stderr. | |
1724 """ | |
1725 progress = self.progress | |
1726 verbose = self.verbose | |
1727 while True: | |
1728 s = stream.readline() | |
1729 if not s: | |
1730 break | |
1731 if progress is not None: | |
1732 progress(s, context) | |
1733 else: | |
1734 if not verbose: | |
1735 sys.stderr.write('.') | |
1736 else: | |
1737 sys.stderr.write(s.decode('utf-8')) | |
1738 sys.stderr.flush() | |
1739 stream.close() | |
1740 | |
1741 def run_command(self, cmd, **kwargs): | |
1742 p = subprocess.Popen(cmd, stdout=subprocess.PIPE, | |
1743 stderr=subprocess.PIPE, **kwargs) | |
1744 t1 = threading.Thread(target=self.reader, args=(p.stdout, 'stdout')) | |
1745 t1.start() | |
1746 t2 = threading.Thread(target=self.reader, args=(p.stderr, 'stderr')) | |
1747 t2.start() | |
1748 p.wait() | |
1749 t1.join() | |
1750 t2.join() | |
1751 if self.progress is not None: | |
1752 self.progress('done.', 'main') | |
1753 elif self.verbose: | |
1754 sys.stderr.write('done.\n') | |
1755 return p | |
1756 | |
1757 | |
1758 def normalize_name(name): | |
1759 """Normalize a python package name a la PEP 503""" | |
1760 # https://www.python.org/dev/peps/pep-0503/#normalized-names | |
1761 return re.sub('[-_.]+', '-', name).lower() |