]> git.saurik.com Git - wxWidgets.git/blame - wxPython/distutils/util.py
test wxString's char<->wchar_t ctors
[wxWidgets.git] / wxPython / distutils / util.py
CommitLineData
1e4a197e
RD
"""distutils.util

Miscellaneous utility functions -- anything that doesn't fit into
one of the other *util.py modules.
"""
6
7__revision__ = "$Id$"
8
9import sys, os, string, re
10from distutils.errors import DistutilsPlatformError
11from distutils.dep_util import newer
12from distutils.spawn import spawn
13from distutils import log
14
def get_platform():
    """Return a string that identifies the current platform.

    This is used mainly to distinguish platform-specific build directories
    and platform-specific built distributions.  Typically includes the OS
    name and version and the architecture (as supplied by 'os.uname()'),
    although the exact information included depends on the OS; eg. for IRIX
    the architecture isn't particularly important (IRIX only runs on SGI
    hardware), but for Linux the kernel version isn't particularly
    important.

    Examples of returned values:
       linux-i586
       linux-alpha (?)
       solaris-2.6-sun4u
       irix-5.3
       irix64-6.2

    For non-POSIX platforms (or when 'os.uname()' is unavailable),
    currently just returns 'sys.platform'.
    """
    if os.name != "posix" or not hasattr(os, 'uname'):
        # XXX what about the architecture? NT is Intel or Alpha,
        # Mac OS is M68k or PPC, etc.
        return sys.platform

    # Try to distinguish various flavours of Unix
    (osname, host, release, version, machine) = os.uname()

    # Convert the OS name to lowercase, remove '/' characters
    # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
    osname = osname.lower().replace('/', '')
    machine = machine.replace(' ', '_')

    if osname[:5] == "linux":
        # At least on Linux/Intel, 'machine' is the processor --
        # i386, etc.
        # XXX what about Alpha, SPARC, etc?
        return "%s-%s" % (osname, machine)
    elif osname[:5] == "sunos":
        # Slice instead of index so an empty release string cannot raise.
        if release[:1] >= "5":          # SunOS 5 == Solaris 2
            osname = "solaris"
            release = "%d.%s" % (int(release[0]) - 3, release[2:])
        # fall through to standard osname-release-machine representation
    elif osname[:4] == "irix":          # could be "irix64"!
        return "%s-%s" % (osname, release)
    elif osname[:3] == "aix":
        return "%s-%s.%s" % (osname, version, release)
    elif osname[:6] == "cygwin":
        osname = "cygwin"
        # Keep only the leading run of digits and dots from the release.
        rel_match = re.match(r'[\d.]+', release)
        if rel_match:
            release = rel_match.group()

    return "%s-%s-%s" % (osname, release, machine)
71
72# get_platform ()
73
74
def convert_path(pathname):
    """Return 'pathname' as a name that will work on the native filesystem.

    The path is split on '/' and put back together again using the current
    directory separator.  Needed because filenames in the setup script are
    always supplied in Unix style, and have to be converted to the local
    convention before we can actually use them in the filesystem.

    When 'os.sep' is already '/', or 'pathname' is empty, 'pathname' is
    returned unchanged.  Otherwise '.' components are dropped, and
    'os.curdir' is returned if nothing is left.

    Raises ValueError on non-Unix-ish systems if 'pathname' either starts
    or ends with a slash.
    """
    if os.sep == '/':
        return pathname
    if not pathname:
        return pathname
    if pathname[0] == '/':
        raise ValueError("path '%s' cannot be absolute" % pathname)
    if pathname[-1] == '/':
        raise ValueError("path '%s' cannot end with '/'" % pathname)

    # Drop every '.' component in a single pass.
    paths = [part for part in pathname.split('/') if part != '.']
    if not paths:
        return os.curdir
    return os.path.join(*paths)
99
100# convert_path ()
101
102
def change_root(new_root, pathname):
    """Return 'pathname' with 'new_root' prepended.

    If 'pathname' is relative, this is equivalent to
    "os.path.join(new_root,pathname)".  Otherwise, it requires making
    'pathname' relative and then joining the two, which is tricky on
    DOS/Windows and Mac OS.

    Raises DistutilsPlatformError if 'os.name' is not one of 'posix',
    'nt', 'os2' or 'mac'.
    """
    if os.name == 'posix':
        if not os.path.isabs(pathname):
            return os.path.join(new_root, pathname)
        else:
            return os.path.join(new_root, pathname[1:])

    elif os.name == 'nt':
        (drive, path) = os.path.splitdrive(pathname)
        # Slice rather than index: 'path' is empty for "" or a bare drive.
        if path[:1] == '\\':
            path = path[1:]
        return os.path.join(new_root, path)

    elif os.name == 'os2':
        (drive, path) = os.path.splitdrive(pathname)
        if path[:1] == os.sep:
            path = path[1:]
        return os.path.join(new_root, path)

    elif os.name == 'mac':
        if not os.path.isabs(pathname):
            return os.path.join(new_root, pathname)
        else:
            # Chop off volume name from start of path
            elements = pathname.split(":", 1)
            pathname = ":" + elements[1]
            return os.path.join(new_root, pathname)

    else:
        raise DistutilsPlatformError(
            "nothing known about platform '%s'" % os.name)
139
140
_environ_checked = 0
def check_environ():
    """Ensure that 'os.environ' has all the environment variables we
    guarantee that users can use in config files, command-line options,
    etc.  Currently this includes:
      HOME - user's home directory (Unix only)
      PLAT - description of the current platform, including hardware
             and OS (see 'get_platform()')

    The work is done at most once per process; later calls return
    immediately.
    """
    global _environ_checked
    if _environ_checked:
        return

    if os.name == 'posix' and 'HOME' not in os.environ:
        try:
            import pwd
            os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
        except (ImportError, KeyError):
            # Deliberate best effort: if the 'pwd' module is missing or the
            # current uid has no entry in the password database, leave HOME
            # unset rather than aborting.
            pass

    if 'PLAT' not in os.environ:
        os.environ['PLAT'] = get_platform()

    _environ_checked = 1
162
163
def subst_vars(s, local_vars):
    """Perform shell/Perl-style variable substitution on 's'.

    Every occurrence of '$' followed by a name is considered a variable,
    and the variable is substituted by the value found in the 'local_vars'
    dictionary (converted with 'str()'), or in 'os.environ' if it's not in
    'local_vars'.  'os.environ' is first checked/augmented to guarantee
    that it contains certain values: see 'check_environ()'.

    Returns the substituted string.  Raises ValueError for any variables
    not found in either 'local_vars' or 'os.environ'.
    """
    check_environ()

    def _subst(match, local_vars=local_vars):
        var_name = match.group(1)
        if var_name in local_vars:
            return str(local_vars[var_name])
        else:
            return os.environ[var_name]

    try:
        return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
    except KeyError:
        # sys.exc_info() is used instead of 'except ... as' so the handler
        # parses on old and new interpreters alike.  Report the bare
        # variable name: formatting the KeyError object itself would wrap
        # the name in an extra pair of quotes.
        missing = sys.exc_info()[1].args[0]
        raise ValueError("invalid variable '$%s'" % missing)
185
186# subst_vars ()
187
188
def grok_environment_error(exc, prefix="error: "):
    """Generate a useful error message from an EnvironmentError (IOError or
    OSError) exception object.

    Does what it can to deal with exception objects that don't have a
    filename (which happens when the error is due to a two-file operation,
    such as 'rename()' or 'link()').  Exceptions without a usable
    'strerror' are described by their last argument, or by 'str(exc)' if
    they carry no arguments.  Returns the error message as a string
    prefixed with 'prefix'.
    """
    if (hasattr(exc, 'filename') and hasattr(exc, 'strerror')
            and exc.strerror is not None):
        if exc.filename:
            error = prefix + "%s: %s" % (exc.filename, exc.strerror)
        else:
            # two-argument functions in posix module don't
            # include the filename in the exception object!
            error = prefix + "%s" % exc.strerror
    else:
        # Fall back to the last exception argument.  Objects without an
        # 'args' attribute are indexed directly, as the original code did.
        details = getattr(exc, 'args', exc)
        try:
            error = prefix + str(details[-1])
        except (IndexError, TypeError):
            error = prefix + str(exc)

    return error
209
210
# Needed by 'split_quoted()'
_wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
_squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
_dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')

def split_quoted(s):
    """Split a string up according to Unix shell-like rules for quotes and
    backslashes.

    In short: words are delimited by whitespace, as long as that whitespace
    is not escaped by a backslash, or inside a quoted string.  Single and
    double quotes are equivalent, and the quote characters can be
    backslash-escaped.  The backslash is stripped from any two-character
    escape sequence outside quotes, leaving only the escaped character.
    The quote characters are stripped from any quoted string.

    Returns a list of words.  Raises ValueError if a quote is opened but
    never closed.
    """

    # This is a nice algorithm for splitting up a single string, since it
    # doesn't require character-by-character examination.  It was a little
    # bit of a brain-bender to get it working right, though...

    s = s.strip()
    words = []
    pos = 0         # where scanning resumes inside the current word

    while s:
        m = _wordchars_re.match(s, pos)
        end = m.end()
        if end == len(s):
            # Ran off the end of the string: the rest is the last word.
            words.append(s[:end])
            break

        if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
            words.append(s[:end])       # we definitely have a word delimiter
            s = s[end:].lstrip()
            pos = 0

        elif s[end] == '\\':            # preserve whatever is being escaped;
                                        # will become part of the current word
            s = s[:end] + s[end+1:]
            pos = end+1

        else:
            if s[end] == "'":           # slurp singly-quoted string
                m = _squote_re.match(s, end)
            elif s[end] == '"':         # slurp doubly-quoted string
                m = _dquote_re.match(s, end)
            else:
                raise RuntimeError(
                    "this can't happen (bad char '%c')" % s[end])

            if m is None:
                raise ValueError(
                    "bad string (mismatched %s quotes?)" % s[end])

            # Splice the quoted text back in without its two quote
            # characters; resume just past where the closing quote was.
            (beg, end) = m.span()
            s = s[:beg] + s[beg+1:end-1] + s[end:]
            pos = m.end() - 2

        if pos >= len(s):
            words.append(s)
            break

    return words
274
275# split_quoted ()
276
277
def execute(func, args, msg=None, verbose=0, dry_run=0):
    """Perform some action that affects the outside world (eg. by
    writing to the filesystem).

    Such actions are special because they are disabled by the 'dry_run'
    flag.  This function takes care of all that bureaucracy for you; all
    you have to do is supply the function to call and an argument tuple
    for it (to embody the "external action" being performed), and an
    optional message to log.  If 'msg' is None, a message is built from
    the function's name and the repr of 'args'.

    'verbose' is accepted but not used by this function.
    """
    if msg is None:
        msg = "%s%s" % (func.__name__, repr(args))
        if msg[-2:] == ',)':        # correct for singleton tuple
            msg = msg[0:-2] + ')'

    log.info(msg)
    if not dry_run:
        func(*args)
295
296
def strtobool(val):
    """Convert a string representation of truth to true (1) or false (0).

    True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
    are 'n', 'no', 'f', 'false', 'off', and '0'.  The comparison is
    case-insensitive.  Raises ValueError if 'val' is anything else.
    """
    val = val.lower()
    if val in ('y', 'yes', 't', 'true', 'on', '1'):
        return 1
    elif val in ('n', 'no', 'f', 'false', 'off', '0'):
        return 0
    else:
        raise ValueError("invalid truth value %s" % repr(val))
311
312
def byte_compile(py_files,
                 optimize=0, force=0,
                 prefix=None, base_dir=None,
                 verbose=1, dry_run=0,
                 direct=None):
    """Byte-compile a collection of Python source files to either .pyc
    or .pyo files in the same directory.  'py_files' is a list of files
    to compile; any files that don't end in ".py" are silently skipped.
    'optimize' must be one of the following:
      0 - don't optimize (generate .pyc)
      1 - normal optimization (like "python -O")
      2 - extra optimization (like "python -OO")
    If 'force' is true, all files are recompiled regardless of
    timestamps.

    The source filename encoded in each bytecode file defaults to the
    filenames listed in 'py_files'; you can modify these with 'prefix' and
    'base_dir'.  'prefix' is a string that will be stripped off of each
    source filename, and 'base_dir' is a directory name that will be
    prepended (after 'prefix' is stripped).  You can supply either or both
    (or neither) of 'prefix' and 'base_dir', as you wish.  Raises
    ValueError if a filename does not start with 'prefix'.

    If 'dry_run' is true, doesn't actually do anything that would
    affect the filesystem.

    'verbose' is only passed through to the script generated in indirect
    mode.

    Byte-compilation is either done directly in this interpreter process
    with the standard py_compile module, or indirectly by writing a
    temporary script and executing it.  Normally, you should let
    'byte_compile()' figure out whether to use direct compilation or not
    (see the source for details).  The 'direct' flag is used by the script
    generated in indirect mode; unless you know what you're doing, leave
    it set to None.
    """

    # First, if the caller didn't force us into direct or indirect mode,
    # figure out which mode we should be in.  We take a conservative
    # approach: choose direct mode *only* if the current interpreter is
    # in debug mode and optimize is 0.  If we're not in debug mode (-O
    # or -OO), we don't know which level of optimization this
    # interpreter is running with, so we can't do direct
    # byte-compilation and be certain that it's the right thing.  Thus,
    # always compile indirectly if the current interpreter is in either
    # optimize mode, or if either optimization level was requested by
    # the caller.
    if direct is None:
        direct = (__debug__ and optimize == 0)

    # "Indirect" byte-compilation: write a temporary script and then
    # run it with the appropriate flags.
    if not direct:
        try:
            from tempfile import mkstemp
            (script_fd, script_name) = mkstemp(".py")
        except ImportError:
            from tempfile import mktemp
            (script_fd, script_name) = None, mktemp(".py")
        log.info("writing byte-compilation script '%s'", script_name)
        if dry_run:
            # mkstemp() has already created and opened the file; nothing
            # later in a dry run would close or delete it, so undo that
            # here instead of leaking a descriptor and a stray temp file.
            if script_fd is not None:
                os.close(script_fd)
                os.remove(script_name)
        else:
            if script_fd is not None:
                script = os.fdopen(script_fd, "w")
            else:
                script = open(script_name, "w")

            try:
                script.write("""\
from distutils.util import byte_compile
files = [
""")

                # XXX would be nice to write absolute filenames, just for
                # safety's sake (script should be more robust in the face
                # of chdir'ing before running it).  But this requires
                # abspath'ing 'prefix' as well, and that breaks the hack in
                # build_lib's 'byte_compile()' method that carefully tacks
                # on a trailing slash (os.sep really) to make sure the
                # prefix here is "just right".  This whole prefix business
                # is rather delicate -- the problem is that it's really a
                # directory, but I'm treating it as a dumb string, so
                # trailing slashes and so forth matter.

                script.write(",\n".join(map(repr, py_files)) + "]\n")
                script.write("""
byte_compile(files, optimize=%s, force=%s,
             prefix=%s, base_dir=%s,
             verbose=%s, dry_run=0,
             direct=1)
""" % (repr(optimize), repr(force), repr(prefix), repr(base_dir),
       repr(verbose)))
            finally:
                # Close the script even if a write fails.
                script.close()

        cmd = [sys.executable, script_name]
        if optimize == 1:
            cmd.insert(1, "-O")
        elif optimize == 2:
            cmd.insert(1, "-OO")
        try:
            spawn(cmd, dry_run=dry_run)
        finally:
            # Remove the temporary script even when the child fails.
            execute(os.remove, (script_name,), "removing %s" % script_name,
                    dry_run=dry_run)

    # "Direct" byte-compilation: use the py_compile module to compile
    # right here, right now.  Note that the script generated in indirect
    # mode simply calls 'byte_compile()' in direct mode, a weird sort of
    # cross-process recursion.  Hey, it works!
    else:
        import py_compile

        for source in py_files:
            if source[-3:] != ".py":
                # This lets us be lazy and not filter filenames in
                # the "install_lib" command.
                continue

            # Terminology from the py_compile module:
            #   cfile - byte-compiled file
            #   dfile - purported source filename (same as 'source' by
            #           default)
            if __debug__:
                cfile = source + "c"
            else:
                cfile = source + "o"
            dfile = source
            if prefix:
                if source[:len(prefix)] != prefix:
                    raise ValueError(
                        "invalid prefix: filename %s doesn't start with %s"
                        % (repr(source), repr(prefix)))
                dfile = dfile[len(prefix):]
            if base_dir:
                dfile = os.path.join(base_dir, dfile)

            cfile_base = os.path.basename(cfile)
            if force or newer(source, cfile):
                log.info("byte-compiling %s to %s", source, cfile_base)
                if not dry_run:
                    py_compile.compile(source, cfile, dfile)
            else:
                log.debug("skipping byte-compilation of %s to %s",
                          source, cfile_base)
450
451# byte_compile ()
452
def rfc822_escape(header):
    """Return a version of the string escaped for inclusion in an
    RFC-822 header, by ensuring there are 8 spaces after each newline.

    Leading and trailing whitespace is stripped from every line of
    'header' before the lines are rejoined.
    """
    lines = [line.strip() for line in header.split('\n')]
    return ('\n' + 8*' ').join(lines)