]>
Commit | Line | Data |
---|---|---|
b5fe885e A |
1 | /*- |
2 | * Copyright (c) 2005 - Garance Alistair Drosehn <gad@FreeBSD.org>. | |
3 | * All rights reserved. | |
4 | * | |
5 | * Redistribution and use in source and binary forms, with or without | |
6 | * modification, are permitted provided that the following conditions | |
7 | * are met: | |
8 | * 1. Redistributions of source code must retain the above copyright | |
9 | * notice, this list of conditions and the following disclaimer. | |
10 | * 2. Redistributions in binary form must reproduce the above copyright | |
11 | * notice, this list of conditions and the following disclaimer in the | |
12 | * documentation and/or other materials provided with the distribution. | |
13 | * | |
14 | * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND | |
15 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
16 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
17 | * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE | |
18 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | |
19 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | |
20 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | |
21 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | |
22 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | |
23 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | |
24 | * SUCH DAMAGE. | |
25 | * | |
26 | * The views and conclusions contained in the software and documentation | |
27 | * are those of the authors and should not be interpreted as representing | |
28 | * official policies, either expressed or implied, of the FreeBSD Project. | |
29 | */ | |
30 | ||
31 | #include <sys/cdefs.h> | |
32 | __FBSDID("$FreeBSD$"); | |
33 | ||
34 | #include <sys/stat.h> | |
35 | #include <sys/param.h> | |
36 | #include <err.h> | |
37 | #include <errno.h> | |
38 | #include <ctype.h> | |
39 | #include <stdio.h> | |
40 | #include <stdlib.h> | |
41 | #include <string.h> | |
42 | #include <unistd.h> | |
43 | ||
44 | #include "envopts.h" | |
45 | ||
46 | static const char * | |
47 | expand_vars(int in_thisarg, char **thisarg_p, char **dest_p, | |
48 | const char **src_p); | |
49 | static int is_there(char *candidate); | |
50 | ||
51 | /* | |
52 | * The is*() routines take a parameter of 'int', but expect values in the range | |
53 | * of unsigned char. Define some wrappers which take a value of type 'char', | |
54 | * whether signed or unsigned, and ensure the value ends up in the right range. | |
55 | */ | |
56 | #define isalnumch(Anychar) isalnum((u_char)(Anychar)) | |
57 | #define isalphach(Anychar) isalpha((u_char)(Anychar)) | |
58 | #define isspacech(Anychar) isspace((u_char)(Anychar)) | |
59 | ||
60 | /* | |
61 | * Routine to determine if a given fully-qualified filename is executable. | |
62 | * This is copied almost verbatim from FreeBSD's usr.bin/which/which.c. | |
63 | */ | |
64 | static int | |
65 | is_there(char *candidate) | |
66 | { | |
67 | struct stat fin; | |
68 | ||
69 | /* XXX work around access(2) false positives for superuser */ | |
70 | if (access(candidate, X_OK) == 0 && | |
71 | stat(candidate, &fin) == 0 && | |
72 | S_ISREG(fin.st_mode) && | |
73 | (getuid() != 0 || | |
74 | (fin.st_mode & (S_IXUSR | S_IXGRP | S_IXOTH)) != 0)) { | |
75 | if (env_verbosity > 1) | |
76 | fprintf(stderr, "#env matched:\t'%s'\n", candidate); | |
77 | return (1); | |
78 | } | |
79 | return (0); | |
80 | } | |
81 | ||
82 | /** | |
83 | * Routine to search through an alternate path-list, looking for a given | |
84 | * filename to execute. If the file is found, replace the original | |
85 | * unqualified name with a fully-qualified path. This allows `env' to | |
86 | * execute programs from a specific strict list of possible paths, without | |
87 | * changing the value of PATH seen by the program which will be executed. | |
88 | * E.G.: | |
89 | * #!/usr/bin/env -S-P/usr/local/bin:/usr/bin perl | |
90 | * will execute /usr/local/bin/perl or /usr/bin/perl (whichever is found | |
91 | * first), no matter what the current value of PATH is, and without | |
92 | * changing the value of PATH that the script will see when it runs. | |
93 | * | |
94 | * This is similar to the print_matches() routine in usr.bin/which/which.c. | |
95 | */ | |
96 | void | |
97 | search_paths(char *path, char **argv) | |
98 | { | |
99 | char candidate[PATH_MAX]; | |
100 | const char *d; | |
101 | char *filename, *fqname; | |
102 | ||
103 | /* If the file has a `/' in it, then no search is done */ | |
104 | filename = *argv; | |
105 | if (strchr(filename, '/') != NULL) | |
106 | return; | |
107 | ||
108 | if (env_verbosity > 1) { | |
109 | fprintf(stderr, "#env Searching:\t'%s'\n", path); | |
110 | fprintf(stderr, "#env for file:\t'%s'\n", filename); | |
111 | } | |
112 | ||
113 | fqname = NULL; | |
114 | while ((d = strsep(&path, ":")) != NULL) { | |
115 | if (*d == '\0') | |
116 | d = "."; | |
117 | if (snprintf(candidate, sizeof(candidate), "%s/%s", d, | |
118 | filename) >= (int)sizeof(candidate)) | |
119 | continue; | |
120 | if (is_there(candidate)) { | |
121 | fqname = candidate; | |
122 | break; | |
123 | } | |
124 | } | |
125 | ||
126 | if (fqname == NULL) { | |
127 | errno = ENOENT; | |
128 | err(127, "%s", filename); | |
129 | } | |
130 | *argv = strdup(candidate); | |
131 | } | |
132 | ||
133 | /** | |
134 | * Routine to split a string into multiple parameters, while recognizing a | |
135 | * few special characters. It recognizes both single and double-quoted | |
136 | * strings. This processing is designed entirely for the benefit of the | |
137 | * parsing of "#!"-lines (aka "shebang" lines == the first line of an | |
138 | * executable script). Different operating systems parse that line in very | |
139 | * different ways, and this split-on-spaces processing is meant to provide | |
140 | * ways to specify arbitrary arguments on that line, no matter how the OS | |
141 | * parses it. | |
142 | * | |
143 | * Within a single-quoted string, the two characters "\'" are treated as | |
144 | * a literal "'" character to add to the string, and "\\" are treated as | |
145 | * a literal "\" character to add. Other than that, all characters are | |
146 | * copied until the processing gets to a terminating "'". | |
147 | * | |
148 | * Within a double-quoted string, many more "\"-style escape sequences | |
149 | * are recognized, mostly copied from what is recognized in the `printf' | |
150 | * command. Some OS's will not allow a literal blank character to be | |
151 | * included in the one argument that they recognize on a shebang-line, | |
152 | * so a few additional escape-sequences are defined to provide ways to | |
153 | * specify blanks. | |
154 | * | |
155 | * Within a double-quoted string "\_" is turned into a literal blank. | |
156 | * (Inside of a single-quoted string, the two characters are just copied) | |
157 | * Outside of a quoted string, "\_" is treated as both a blank, and the | |
158 | * end of the current argument. So with a shelbang-line of: | |
159 | * #!/usr/bin/env -SA=avalue\_perl | |
160 | * the -S value would be broken up into arguments "A=avalue" and "perl". | |
161 | */ | |
162 | void | |
163 | split_spaces(const char *str, int *origind, int *origc, char ***origv) | |
164 | { | |
165 | static const char *nullarg = ""; | |
166 | const char *bq_src, *copystr, *src; | |
167 | char *dest, **newargv, *newstr, **nextarg, **oldarg; | |
168 | int addcount, bq_destlen, copychar, found_sep, in_arg, in_dq, in_sq; | |
169 | ||
170 | /* | |
171 | * Ignore leading space on the string, and then malloc enough room | |
172 | * to build a copy of it. The copy might end up shorter than the | |
173 | * original, due to quoted strings and '\'-processing. | |
174 | */ | |
175 | while (isspacech(*str)) | |
176 | str++; | |
177 | if (*str == '\0') | |
178 | return; | |
179 | newstr = malloc(strlen(str) + 1); | |
180 | ||
181 | /* | |
182 | * Allocate plenty of space for the new array of arg-pointers, | |
183 | * and start that array off with the first element of the old | |
184 | * array. | |
185 | */ | |
186 | newargv = malloc((*origc + (strlen(str) / 2) + 2) * sizeof(char *)); | |
187 | nextarg = newargv; | |
188 | *nextarg++ = **origv; | |
189 | ||
190 | /* Come up with the new args by splitting up the given string. */ | |
191 | addcount = 0; | |
192 | bq_destlen = in_arg = in_dq = in_sq = 0; | |
193 | bq_src = NULL; | |
194 | for (src = str, dest = newstr; *src != '\0'; src++) { | |
195 | /* | |
196 | * This switch will look at a character in *src, and decide | |
197 | * what should be copied to *dest. It only decides what | |
198 | * character(s) to copy, it should not modify *dest. In some | |
199 | * cases, it will look at multiple characters from *src. | |
200 | */ | |
201 | copychar = found_sep = 0; | |
202 | copystr = NULL; | |
203 | switch (*src) { | |
204 | case '"': | |
205 | if (in_sq) | |
206 | copychar = *src; | |
207 | else if (in_dq) | |
208 | in_dq = 0; | |
209 | else { | |
210 | /* | |
211 | * Referencing nullarg ensures that a new | |
212 | * argument is created, even if this quoted | |
213 | * string ends up with zero characters. | |
214 | */ | |
215 | copystr = nullarg; | |
216 | in_dq = 1; | |
217 | bq_destlen = dest - *(nextarg - 1); | |
218 | bq_src = src; | |
219 | } | |
220 | break; | |
221 | case '$': | |
222 | if (in_sq) | |
223 | copychar = *src; | |
224 | else { | |
225 | copystr = expand_vars(in_arg, (nextarg - 1), | |
226 | &dest, &src); | |
227 | } | |
228 | break; | |
229 | case '\'': | |
230 | if (in_dq) | |
231 | copychar = *src; | |
232 | else if (in_sq) | |
233 | in_sq = 0; | |
234 | else { | |
235 | /* | |
236 | * Referencing nullarg ensures that a new | |
237 | * argument is created, even if this quoted | |
238 | * string ends up with zero characters. | |
239 | */ | |
240 | copystr = nullarg; | |
241 | in_sq = 1; | |
242 | bq_destlen = dest - *(nextarg - 1); | |
243 | bq_src = src; | |
244 | } | |
245 | break; | |
246 | case '\\': | |
247 | if (in_sq) { | |
248 | /* | |
249 | * Inside single-quoted strings, only the | |
250 | * "\'" and "\\" are recognized as special | |
251 | * strings. | |
252 | */ | |
253 | copychar = *(src + 1); | |
254 | if (copychar == '\'' || copychar == '\\') | |
255 | src++; | |
256 | else | |
257 | copychar = *src; | |
258 | break; | |
259 | } | |
260 | src++; | |
261 | switch (*src) { | |
262 | case '"': | |
263 | case '#': | |
264 | case '$': | |
265 | case '\'': | |
266 | case '\\': | |
267 | copychar = *src; | |
268 | break; | |
269 | case '_': | |
270 | /* | |
271 | * Alternate way to get a blank, which allows | |
272 | * that blank be used to separate arguments | |
273 | * when it is not inside a quoted string. | |
274 | */ | |
275 | if (in_dq) | |
276 | copychar = ' '; | |
277 | else { | |
278 | found_sep = 1; | |
279 | src++; | |
280 | } | |
281 | break; | |
282 | case 'c': | |
283 | /* | |
284 | * Ignore remaining characters in the -S string. | |
285 | * This would not make sense if found in the | |
286 | * middle of a quoted string. | |
287 | */ | |
288 | if (in_dq) | |
289 | errx(1, "Sequence '\\%c' is not allowed" | |
290 | " in quoted strings", *src); | |
291 | goto str_done; | |
292 | case 'f': | |
293 | copychar = '\f'; | |
294 | break; | |
295 | case 'n': | |
296 | copychar = '\n'; | |
297 | break; | |
298 | case 'r': | |
299 | copychar = '\r'; | |
300 | break; | |
301 | case 't': | |
302 | copychar = '\t'; | |
303 | break; | |
304 | case 'v': | |
305 | copychar = '\v'; | |
306 | break; | |
307 | default: | |
308 | if (isspacech(*src)) | |
309 | copychar = *src; | |
310 | else | |
311 | errx(1, "Invalid sequence '\\%c' in -S", | |
312 | *src); | |
313 | } | |
314 | break; | |
315 | default: | |
316 | if ((in_dq || in_sq) && in_arg) | |
317 | copychar = *src; | |
318 | else if (isspacech(*src)) | |
319 | found_sep = 1; | |
320 | else { | |
321 | /* | |
322 | * If the first character of a new argument | |
323 | * is `#', then ignore the remaining chars. | |
324 | */ | |
325 | if (!in_arg && *src == '#') | |
326 | goto str_done; | |
327 | copychar = *src; | |
328 | } | |
329 | } | |
330 | /* | |
331 | * Now that the switch has determined what (if anything) | |
332 | * needs to be copied, copy whatever that is to *dest. | |
333 | */ | |
334 | if (copychar || copystr != NULL) { | |
335 | if (!in_arg) { | |
336 | /* This is the first byte of a new argument */ | |
337 | *nextarg++ = dest; | |
338 | addcount++; | |
339 | in_arg = 1; | |
340 | } | |
341 | if (copychar) | |
342 | *dest++ = (char)copychar; | |
343 | else if (copystr != NULL) | |
344 | while (*copystr != '\0') | |
345 | *dest++ = *copystr++; | |
346 | } else if (found_sep) { | |
347 | *dest++ = '\0'; | |
348 | while (isspacech(*src)) | |
349 | src++; | |
350 | --src; | |
351 | in_arg = 0; | |
352 | } | |
353 | } | |
354 | str_done: | |
355 | *dest = '\0'; | |
356 | *nextarg = NULL; | |
357 | if (in_dq || in_sq) { | |
358 | errx(1, "No terminating quote for string: %.*s%s", | |
359 | bq_destlen, *(nextarg - 1), bq_src); | |
360 | } | |
361 | if (env_verbosity > 1) { | |
362 | fprintf(stderr, "#env split -S:\t'%s'\n", str); | |
363 | oldarg = newargv + 1; | |
364 | fprintf(stderr, "#env into:\t'%s'\n", *oldarg); | |
365 | for (oldarg++; *oldarg; oldarg++) | |
366 | fprintf(stderr, "#env &\t'%s'\n", *oldarg); | |
367 | } | |
368 | ||
369 | /* Copy the unprocessed arg-pointers from the original array */ | |
370 | for (oldarg = *origv + *origind; *oldarg; oldarg++) | |
371 | *nextarg++ = *oldarg; | |
372 | *nextarg = NULL; | |
373 | ||
374 | /* Update optind/argc/argv in the calling routine */ | |
375 | *origind = 1; | |
376 | *origc += addcount; | |
377 | *origv = newargv; | |
378 | } | |
379 | ||
380 | /** | |
381 | * Routine to split expand any environment variables referenced in the string | |
382 | * that -S is processing. For now it only supports the form ${VARNAME}. It | |
383 | * explicitly does not support $VARNAME, and obviously can not handle special | |
384 | * shell-variables such as $?, $*, $1, etc. It is called with *src_p pointing | |
385 | * at the initial '$', and if successful it will update *src_p, *dest_p, and | |
386 | * possibly *thisarg_p in the calling routine. | |
387 | */ | |
388 | static const char * | |
389 | expand_vars(int in_thisarg, char **thisarg_p, char **dest_p, const char **src_p) | |
390 | { | |
391 | const char *vbegin, *vend, *vvalue; | |
392 | char *newstr, *vname; | |
393 | int bad_reference; | |
394 | size_t namelen, newlen; | |
395 | ||
396 | bad_reference = 1; | |
397 | vbegin = vend = (*src_p) + 1; | |
398 | if (*vbegin++ == '{') | |
399 | if (*vbegin == '_' || isalphach(*vbegin)) { | |
400 | vend = vbegin + 1; | |
401 | while (*vend == '_' || isalnumch(*vend)) | |
402 | vend++; | |
403 | if (*vend == '}') | |
404 | bad_reference = 0; | |
405 | } | |
406 | if (bad_reference) | |
407 | errx(1, "Only ${VARNAME} expansion is supported, error at: %s", | |
408 | *src_p); | |
409 | ||
410 | /* | |
411 | * We now know we have a valid environment variable name, so update | |
412 | * the caller's source-pointer to the last character in that reference, | |
413 | * and then pick up the matching value. If the variable is not found, | |
414 | * or if it has a null value, then our work here is done. | |
415 | */ | |
416 | *src_p = vend; | |
417 | namelen = vend - vbegin + 1; | |
418 | vname = malloc(namelen); | |
419 | strlcpy(vname, vbegin, namelen); | |
420 | vvalue = getenv(vname); | |
421 | if (vvalue == NULL || *vvalue == '\0') { | |
422 | if (env_verbosity > 2) | |
423 | fprintf(stderr, | |
424 | "#env replacing ${%s} with null string\n", | |
425 | vname); | |
426 | free(vname); | |
427 | return (NULL); | |
428 | } | |
429 | ||
430 | if (env_verbosity > 2) | |
431 | fprintf(stderr, "#env expanding ${%s} into '%s'\n", vname, | |
432 | vvalue); | |
433 | ||
434 | /* | |
435 | * There is some value to copy to the destination. If the value is | |
436 | * shorter than the ${VARNAME} reference that it replaces, then our | |
437 | * caller can just copy the value to the existing destination. | |
438 | */ | |
439 | if (strlen(vname) + 3 >= strlen(vvalue)) { | |
440 | free(vname); | |
441 | return (vvalue); | |
442 | } | |
443 | ||
444 | /* | |
445 | * The value is longer than the string it replaces, which means the | |
446 | * present destination area is too small to hold it. Create a new | |
447 | * destination area, and update the caller's 'dest' variable to match. | |
448 | * If the caller has already started copying some info for 'thisarg' | |
449 | * into the present destination, then the new destination area must | |
450 | * include a copy of that data, and the pointer to 'thisarg' must also | |
451 | * be updated. Note that it is still the caller which copies this | |
452 | * vvalue to the new *dest. | |
453 | */ | |
454 | newlen = strlen(vvalue) + strlen(*src_p) + 1; | |
455 | if (in_thisarg) { | |
456 | **dest_p = '\0'; /* Provide terminator for 'thisarg' */ | |
457 | newlen += strlen(*thisarg_p); | |
458 | newstr = malloc(newlen); | |
459 | strcpy(newstr, *thisarg_p); | |
460 | *thisarg_p = newstr; | |
461 | } else { | |
462 | newstr = malloc(newlen); | |
463 | *newstr = '\0'; | |
464 | } | |
465 | *dest_p = strchr(newstr, '\0'); | |
466 | free(vname); | |
467 | return (vvalue); | |
468 | } |