Commit | Line | Data |
---|---|---|
1e4a197e RD |
1 | """distutils.util |
2 | ||
3 | Miscellaneous utility functions -- anything that doesn't fit into | |
4 | one of the other *util.py modules. | |
5 | """ | |
6 | ||
7 | __revision__ = "$Id$" | |
8 | ||
9 | import sys, os, string, re | |
10 | from distutils.errors import DistutilsPlatformError | |
11 | from distutils.dep_util import newer | |
12 | from distutils.spawn import spawn | |
13 | from distutils import log | |
14 | ||
15 | def get_platform (): | |
16 | """Return a string that identifies the current platform. This is used | |
17 | mainly to distinguish platform-specific build directories and | |
18 | platform-specific built distributions. Typically includes the OS name | |
19 | and version and the architecture (as supplied by 'os.uname()'), | |
20 | although the exact information included depends on the OS; eg. for IRIX | |
21 | the architecture isn't particularly important (IRIX only runs on SGI | |
22 | hardware), but for Linux the kernel version isn't particularly | |
23 | important. | |
24 | ||
25 | Examples of returned values: | |
26 | linux-i586 | |
27 | linux-alpha (?) | |
28 | solaris-2.6-sun4u | |
29 | irix-5.3 | |
30 | irix64-6.2 | |
31 | ||
32 | For non-POSIX platforms, currently just returns 'sys.platform'. | |
33 | """ | |
34 | if os.name != "posix" or not hasattr(os, 'uname'): | |
35 | # XXX what about the architecture? NT is Intel or Alpha, | |
36 | # Mac OS is M68k or PPC, etc. | |
37 | return sys.platform | |
38 | ||
39 | # Try to distinguish various flavours of Unix | |
40 | ||
41 | (osname, host, release, version, machine) = os.uname() | |
42 | ||
43 | # Convert the OS name to lowercase, remove '/' characters | |
44 | # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh") | |
45 | osname = string.lower(osname) | |
46 | osname = string.replace(osname, '/', '') | |
47 | machine = string.replace(machine, ' ', '_') | |
48 | ||
49 | if osname[:5] == "linux": | |
50 | # At least on Linux/Intel, 'machine' is the processor -- | |
51 | # i386, etc. | |
52 | # XXX what about Alpha, SPARC, etc? | |
53 | return "%s-%s" % (osname, machine) | |
54 | elif osname[:5] == "sunos": | |
55 | if release[0] >= "5": # SunOS 5 == Solaris 2 | |
56 | osname = "solaris" | |
57 | release = "%d.%s" % (int(release[0]) - 3, release[2:]) | |
58 | # fall through to standard osname-release-machine representation | |
59 | elif osname[:4] == "irix": # could be "irix64"! | |
60 | return "%s-%s" % (osname, release) | |
61 | elif osname[:3] == "aix": | |
62 | return "%s-%s.%s" % (osname, version, release) | |
63 | elif osname[:6] == "cygwin": | |
64 | osname = "cygwin" | |
65 | rel_re = re.compile (r'[\d.]+') | |
66 | m = rel_re.match(release) | |
67 | if m: | |
68 | release = m.group() | |
69 | ||
70 | return "%s-%s-%s" % (osname, release, machine) | |
71 | ||
72 | # get_platform () | |
73 | ||
74 | ||
75 | def convert_path (pathname): | |
76 | """Return 'pathname' as a name that will work on the native filesystem, | |
77 | i.e. split it on '/' and put it back together again using the current | |
78 | directory separator. Needed because filenames in the setup script are | |
79 | always supplied in Unix style, and have to be converted to the local | |
80 | convention before we can actually use them in the filesystem. Raises | |
81 | ValueError on non-Unix-ish systems if 'pathname' either starts or | |
82 | ends with a slash. | |
83 | """ | |
84 | if os.sep == '/': | |
85 | return pathname | |
86 | if not pathname: | |
87 | return pathname | |
88 | if pathname[0] == '/': | |
89 | raise ValueError, "path '%s' cannot be absolute" % pathname | |
90 | if pathname[-1] == '/': | |
91 | raise ValueError, "path '%s' cannot end with '/'" % pathname | |
92 | ||
93 | paths = string.split(pathname, '/') | |
94 | while '.' in paths: | |
95 | paths.remove('.') | |
96 | if not paths: | |
97 | return os.curdir | |
98 | return apply(os.path.join, paths) | |
99 | ||
100 | # convert_path () | |
101 | ||
102 | ||
103 | def change_root (new_root, pathname): | |
104 | """Return 'pathname' with 'new_root' prepended. If 'pathname' is | |
105 | relative, this is equivalent to "os.path.join(new_root,pathname)". | |
106 | Otherwise, it requires making 'pathname' relative and then joining the | |
107 | two, which is tricky on DOS/Windows and Mac OS. | |
108 | """ | |
109 | if os.name == 'posix': | |
110 | if not os.path.isabs(pathname): | |
111 | return os.path.join(new_root, pathname) | |
112 | else: | |
113 | return os.path.join(new_root, pathname[1:]) | |
114 | ||
115 | elif os.name == 'nt': | |
116 | (drive, path) = os.path.splitdrive(pathname) | |
117 | if path[0] == '\\': | |
118 | path = path[1:] | |
119 | return os.path.join(new_root, path) | |
120 | ||
121 | elif os.name == 'os2': | |
122 | (drive, path) = os.path.splitdrive(pathname) | |
123 | if path[0] == os.sep: | |
124 | path = path[1:] | |
125 | return os.path.join(new_root, path) | |
126 | ||
127 | elif os.name == 'mac': | |
128 | if not os.path.isabs(pathname): | |
129 | return os.path.join(new_root, pathname) | |
130 | else: | |
131 | # Chop off volume name from start of path | |
132 | elements = string.split(pathname, ":", 1) | |
133 | pathname = ":" + elements[1] | |
134 | return os.path.join(new_root, pathname) | |
135 | ||
136 | else: | |
137 | raise DistutilsPlatformError, \ | |
138 | "nothing known about platform '%s'" % os.name | |
139 | ||
140 | ||
141 | _environ_checked = 0 | |
142 | def check_environ (): | |
143 | """Ensure that 'os.environ' has all the environment variables we | |
144 | guarantee that users can use in config files, command-line options, | |
145 | etc. Currently this includes: | |
146 | HOME - user's home directory (Unix only) | |
147 | PLAT - description of the current platform, including hardware | |
148 | and OS (see 'get_platform()') | |
149 | """ | |
150 | global _environ_checked | |
151 | if _environ_checked: | |
152 | return | |
153 | ||
154 | if os.name == 'posix' and not os.environ.has_key('HOME'): | |
155 | import pwd | |
156 | os.environ['HOME'] = pwd.getpwuid(os.getuid())[5] | |
157 | ||
158 | if not os.environ.has_key('PLAT'): | |
159 | os.environ['PLAT'] = get_platform() | |
160 | ||
161 | _environ_checked = 1 | |
162 | ||
163 | ||
164 | def subst_vars (s, local_vars): | |
165 | """Perform shell/Perl-style variable substitution on 'string'. Every | |
166 | occurrence of '$' followed by a name is considered a variable, and | |
167 | variable is substituted by the value found in the 'local_vars' | |
168 | dictionary, or in 'os.environ' if it's not in 'local_vars'. | |
169 | 'os.environ' is first checked/augmented to guarantee that it contains | |
170 | certain values: see 'check_environ()'. Raise ValueError for any | |
171 | variables not found in either 'local_vars' or 'os.environ'. | |
172 | """ | |
173 | check_environ() | |
174 | def _subst (match, local_vars=local_vars): | |
175 | var_name = match.group(1) | |
176 | if local_vars.has_key(var_name): | |
177 | return str(local_vars[var_name]) | |
178 | else: | |
179 | return os.environ[var_name] | |
180 | ||
181 | try: | |
182 | return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s) | |
183 | except KeyError, var: | |
184 | raise ValueError, "invalid variable '$%s'" % var | |
185 | ||
186 | # subst_vars () | |
187 | ||
188 | ||
189 | def grok_environment_error (exc, prefix="error: "): | |
190 | """Generate a useful error message from an EnvironmentError (IOError or | |
191 | OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and | |
192 | does what it can to deal with exception objects that don't have a | |
193 | filename (which happens when the error is due to a two-file operation, | |
194 | such as 'rename()' or 'link()'. Returns the error message as a string | |
195 | prefixed with 'prefix'. | |
196 | """ | |
197 | # check for Python 1.5.2-style {IO,OS}Error exception objects | |
198 | if hasattr(exc, 'filename') and hasattr(exc, 'strerror'): | |
199 | if exc.filename: | |
200 | error = prefix + "%s: %s" % (exc.filename, exc.strerror) | |
201 | else: | |
202 | # two-argument functions in posix module don't | |
203 | # include the filename in the exception object! | |
204 | error = prefix + "%s" % exc.strerror | |
205 | else: | |
206 | error = prefix + str(exc[-1]) | |
207 | ||
208 | return error | |
209 | ||
210 | ||
211 | # Needed by 'split_quoted()' | |
212 | _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace) | |
213 | _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'") | |
214 | _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"') | |
215 | ||
216 | def split_quoted (s): | |
217 | """Split a string up according to Unix shell-like rules for quotes and | |
218 | backslashes. In short: words are delimited by spaces, as long as those | |
219 | spaces are not escaped by a backslash, or inside a quoted string. | |
220 | Single and double quotes are equivalent, and the quote characters can | |
221 | be backslash-escaped. The backslash is stripped from any two-character | |
222 | escape sequence, leaving only the escaped character. The quote | |
223 | characters are stripped from any quoted string. Returns a list of | |
224 | words. | |
225 | """ | |
226 | ||
227 | # This is a nice algorithm for splitting up a single string, since it | |
228 | # doesn't require character-by-character examination. It was a little | |
229 | # bit of a brain-bender to get it working right, though... | |
230 | ||
231 | s = string.strip(s) | |
232 | words = [] | |
233 | pos = 0 | |
234 | ||
235 | while s: | |
236 | m = _wordchars_re.match(s, pos) | |
237 | end = m.end() | |
238 | if end == len(s): | |
239 | words.append(s[:end]) | |
240 | break | |
241 | ||
242 | if s[end] in string.whitespace: # unescaped, unquoted whitespace: now | |
243 | words.append(s[:end]) # we definitely have a word delimiter | |
244 | s = string.lstrip(s[end:]) | |
245 | pos = 0 | |
246 | ||
247 | elif s[end] == '\\': # preserve whatever is being escaped; | |
248 | # will become part of the current word | |
249 | s = s[:end] + s[end+1:] | |
250 | pos = end+1 | |
251 | ||
252 | else: | |
253 | if s[end] == "'": # slurp singly-quoted string | |
254 | m = _squote_re.match(s, end) | |
255 | elif s[end] == '"': # slurp doubly-quoted string | |
256 | m = _dquote_re.match(s, end) | |
257 | else: | |
258 | raise RuntimeError, \ | |
259 | "this can't happen (bad char '%c')" % s[end] | |
260 | ||
261 | if m is None: | |
262 | raise ValueError, \ | |
263 | "bad string (mismatched %s quotes?)" % s[end] | |
264 | ||
265 | (beg, end) = m.span() | |
266 | s = s[:beg] + s[beg+1:end-1] + s[end:] | |
267 | pos = m.end() - 2 | |
268 | ||
269 | if pos >= len(s): | |
270 | words.append(s) | |
271 | break | |
272 | ||
273 | return words | |
274 | ||
275 | # split_quoted () | |
276 | ||
277 | ||
278 | def execute (func, args, msg=None, verbose=0, dry_run=0): | |
279 | """Perform some action that affects the outside world (eg. by | |
280 | writing to the filesystem). Such actions are special because they | |
281 | are disabled by the 'dry_run' flag. This method takes care of all | |
282 | that bureaucracy for you; all you have to do is supply the | |
283 | function to call and an argument tuple for it (to embody the | |
284 | "external action" being performed), and an optional message to | |
285 | print. | |
286 | """ | |
287 | if msg is None: | |
288 | msg = "%s%s" % (func.__name__, `args`) | |
289 | if msg[-2:] == ',)': # correct for singleton tuple | |
290 | msg = msg[0:-2] + ')' | |
291 | ||
292 | log.info(msg) | |
293 | if not dry_run: | |
294 | apply(func, args) | |
295 | ||
296 | ||
297 | def strtobool (val): | |
298 | """Convert a string representation of truth to true (1) or false (0). | |
299 | ||
300 | True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values | |
301 | are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if | |
302 | 'val' is anything else. | |
303 | """ | |
304 | val = string.lower(val) | |
305 | if val in ('y', 'yes', 't', 'true', 'on', '1'): | |
306 | return 1 | |
307 | elif val in ('n', 'no', 'f', 'false', 'off', '0'): | |
308 | return 0 | |
309 | else: | |
310 | raise ValueError, "invalid truth value %s" % `val` | |
311 | ||
312 | ||
313 | def byte_compile (py_files, | |
314 | optimize=0, force=0, | |
315 | prefix=None, base_dir=None, | |
316 | verbose=1, dry_run=0, | |
317 | direct=None): | |
318 | """Byte-compile a collection of Python source files to either .pyc | |
319 | or .pyo files in the same directory. 'py_files' is a list of files | |
320 | to compile; any files that don't end in ".py" are silently skipped. | |
321 | 'optimize' must be one of the following: | |
322 | 0 - don't optimize (generate .pyc) | |
323 | 1 - normal optimization (like "python -O") | |
324 | 2 - extra optimization (like "python -OO") | |
325 | If 'force' is true, all files are recompiled regardless of | |
326 | timestamps. | |
327 | ||
328 | The source filename encoded in each bytecode file defaults to the | |
329 | filenames listed in 'py_files'; you can modify these with 'prefix' and | |
330 | 'basedir'. 'prefix' is a string that will be stripped off of each | |
331 | source filename, and 'base_dir' is a directory name that will be | |
332 | prepended (after 'prefix' is stripped). You can supply either or both | |
333 | (or neither) of 'prefix' and 'base_dir', as you wish. | |
334 | ||
335 | If 'dry_run' is true, doesn't actually do anything that would | |
336 | affect the filesystem. | |
337 | ||
338 | Byte-compilation is either done directly in this interpreter process | |
339 | with the standard py_compile module, or indirectly by writing a | |
340 | temporary script and executing it. Normally, you should let | |
341 | 'byte_compile()' figure out to use direct compilation or not (see | |
342 | the source for details). The 'direct' flag is used by the script | |
343 | generated in indirect mode; unless you know what you're doing, leave | |
344 | it set to None. | |
345 | """ | |
346 | ||
347 | # First, if the caller didn't force us into direct or indirect mode, | |
348 | # figure out which mode we should be in. We take a conservative | |
349 | # approach: choose direct mode *only* if the current interpreter is | |
350 | # in debug mode and optimize is 0. If we're not in debug mode (-O | |
351 | # or -OO), we don't know which level of optimization this | |
352 | # interpreter is running with, so we can't do direct | |
353 | # byte-compilation and be certain that it's the right thing. Thus, | |
354 | # always compile indirectly if the current interpreter is in either | |
355 | # optimize mode, or if either optimization level was requested by | |
356 | # the caller. | |
357 | if direct is None: | |
358 | direct = (__debug__ and optimize == 0) | |
359 | ||
360 | # "Indirect" byte-compilation: write a temporary script and then | |
361 | # run it with the appropriate flags. | |
362 | if not direct: | |
363 | try: | |
364 | from tempfile import mkstemp | |
365 | (script_fd, script_name) = mkstemp(".py") | |
366 | except ImportError: | |
367 | from tempfile import mktemp | |
368 | (script_fd, script_name) = None, mktemp(".py") | |
369 | log.info("writing byte-compilation script '%s'", script_name) | |
370 | if not dry_run: | |
371 | if script_fd is not None: | |
372 | script = os.fdopen(script_fd, "w") | |
373 | else: | |
374 | script = open(script_name, "w") | |
375 | ||
376 | script.write("""\ | |
377 | from distutils.util import byte_compile | |
378 | files = [ | |
379 | """) | |
380 | ||
381 | # XXX would be nice to write absolute filenames, just for | |
382 | # safety's sake (script should be more robust in the face of | |
383 | # chdir'ing before running it). But this requires abspath'ing | |
384 | # 'prefix' as well, and that breaks the hack in build_lib's | |
385 | # 'byte_compile()' method that carefully tacks on a trailing | |
386 | # slash (os.sep really) to make sure the prefix here is "just | |
387 | # right". This whole prefix business is rather delicate -- the | |
388 | # problem is that it's really a directory, but I'm treating it | |
389 | # as a dumb string, so trailing slashes and so forth matter. | |
390 | ||
391 | #py_files = map(os.path.abspath, py_files) | |
392 | #if prefix: | |
393 | # prefix = os.path.abspath(prefix) | |
394 | ||
395 | script.write(string.join(map(repr, py_files), ",\n") + "]\n") | |
396 | script.write(""" | |
397 | byte_compile(files, optimize=%s, force=%s, | |
398 | prefix=%s, base_dir=%s, | |
399 | verbose=%s, dry_run=0, | |
400 | direct=1) | |
401 | """ % (`optimize`, `force`, `prefix`, `base_dir`, `verbose`)) | |
402 | ||
403 | script.close() | |
404 | ||
405 | cmd = [sys.executable, script_name] | |
406 | if optimize == 1: | |
407 | cmd.insert(1, "-O") | |
408 | elif optimize == 2: | |
409 | cmd.insert(1, "-OO") | |
410 | spawn(cmd, dry_run=dry_run) | |
411 | execute(os.remove, (script_name,), "removing %s" % script_name, | |
412 | dry_run=dry_run) | |
413 | ||
414 | # "Direct" byte-compilation: use the py_compile module to compile | |
415 | # right here, right now. Note that the script generated in indirect | |
416 | # mode simply calls 'byte_compile()' in direct mode, a weird sort of | |
417 | # cross-process recursion. Hey, it works! | |
418 | else: | |
419 | from py_compile import compile | |
420 | ||
421 | for file in py_files: | |
422 | if file[-3:] != ".py": | |
423 | # This lets us be lazy and not filter filenames in | |
424 | # the "install_lib" command. | |
425 | continue | |
426 | ||
427 | # Terminology from the py_compile module: | |
428 | # cfile - byte-compiled file | |
429 | # dfile - purported source filename (same as 'file' by default) | |
430 | cfile = file + (__debug__ and "c" or "o") | |
431 | dfile = file | |
432 | if prefix: | |
433 | if file[:len(prefix)] != prefix: | |
434 | raise ValueError, \ | |
435 | ("invalid prefix: filename %s doesn't start with %s" | |
436 | % (`file`, `prefix`)) | |
437 | dfile = dfile[len(prefix):] | |
438 | if base_dir: | |
439 | dfile = os.path.join(base_dir, dfile) | |
440 | ||
441 | cfile_base = os.path.basename(cfile) | |
442 | if direct: | |
443 | if force or newer(file, cfile): | |
444 | log.info("byte-compiling %s to %s", file, cfile_base) | |
445 | if not dry_run: | |
446 | compile(file, cfile, dfile) | |
447 | else: | |
448 | log.debug("skipping byte-compilation of %s to %s", | |
449 | file, cfile_base) | |
450 | ||
451 | # byte_compile () | |
452 | ||
453 | def rfc822_escape (header): | |
454 | """Return a version of the string escaped for inclusion in an | |
455 | RFC-822 header, by ensuring there are 8 spaces space after each newline. | |
456 | """ | |
457 | lines = string.split(header, '\n') | |
458 | lines = map(string.strip, lines) | |
459 | header = string.join(lines, '\n' + 8*' ') | |
460 | return header |