glibc/posix/wordexp.c
Ulrich Drepper 1ffaaca2a3 Update.
1998-09-14 22:46  Tim Waugh  <tim@cyberelk.demon.co.uk>

	* posix/wordexp-test.c: Chet Ramey confirmed that bash's behaviour
	for field-splitting 🔤 is correct, and that two fields should
	result. Revert tests to reflect this.

	* posix/wordexp.c (w_emptyword): Remove function.
	(exec_comm): Don't use w_emptyword.
	(parse_param): Likewise.
1998-09-14 15:22:40 +00:00

2252 lines
46 KiB
C

/* POSIX.2 wordexp implementation.
Copyright (C) 1997, 1998 Free Software Foundation, Inc.
This file is part of the GNU C Library.
Contributed by Tim Waugh <tim@cyberelk.demon.co.uk>.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Library General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Library General Public License for more details.
You should have received a copy of the GNU Library General Public
License along with the GNU C Library; see the file COPYING.LIB. If not,
write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
Boston, MA 02111-1307, USA. */
#include <wordexp.h>
#include <signal.h>
#include <stdlib.h>
#include <pwd.h>
#include <sys/types.h>
#include <string.h>
#include <glob.h>
#include <ctype.h>
#include <sys/time.h>
#include <sys/types.h>
#include <sys/wait.h>
#include <unistd.h>
#include <fcntl.h>
#include <sys/stat.h>
#include <paths.h>
#include <errno.h>
#include <sys/param.h>
#include <stdio.h>
#include <fnmatch.h>
#include <stdio-common/_itoa.h>
/* Undefine the following line for the production version. */
/* #define NDEBUG 1 */
#include <assert.h>
/*
* This is a recursive-descent-style word expansion routine.
*/
/* These variables are defined and initialized in the startup code. */
extern int __libc_argc;
extern char **__libc_argv;
/* Some forward declarations */
static int parse_dollars (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs,
const char *ifs_white, int quoted)
internal_function;
static int parse_backtick (char **word, size_t *word_length,
size_t *max_length, const char *words,
size_t *offset, int flags, wordexp_t *pwordexp,
const char *ifs, const char *ifs_white)
internal_function;
static int parse_dquote (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs,
const char *ifs_white)
internal_function;
static int eval_expr (char *expr, long int *result) internal_function;
/* The w_*() functions manipulate word lists. */
#define W_CHUNK (100)
/* Result of w_newword will be ignored if it the last word. */
static inline char *
w_newword (size_t *actlen, size_t *maxlen)
{
*actlen = *maxlen = 0;
return NULL;
}
static inline char *
w_addchar (char *buffer, size_t *actlen, size_t *maxlen, char ch)
/* (lengths exclude trailing zero) */
{
/* Add a character to the buffer, allocating room for it if needed.
*/
if (*actlen == *maxlen)
{
char *old_buffer = buffer;
assert (buffer == NULL || *maxlen != 0);
*maxlen += W_CHUNK;
buffer = realloc (buffer, 1 + *maxlen);
if (buffer == NULL)
free (old_buffer);
}
if (buffer != NULL)
{
buffer[*actlen] = ch;
buffer[++(*actlen)] = '\0';
}
return buffer;
}
static char *
internal_function
w_addmem (char *buffer, size_t *actlen, size_t *maxlen, const char *str,
size_t len)
{
/* Add a string to the buffer, allocating room for it if needed.
*/
if (*actlen + len > *maxlen)
{
char *old_buffer = buffer;
assert (buffer == NULL || *maxlen != 0);
*maxlen += MAX (2 * len, W_CHUNK);
buffer = realloc (old_buffer, 1 + *maxlen);
if (buffer == NULL)
free (old_buffer);
}
if (buffer != NULL)
{
*((char *) __mempcpy (&buffer[*actlen], str, len)) = '\0';
*actlen += len;
}
return buffer;
}
static char *
internal_function
w_addstr (char *buffer, size_t *actlen, size_t *maxlen, const char *str)
/* (lengths exclude trailing zero) */
{
/* Add a string to the buffer, allocating room for it if needed.
*/
size_t len;
assert (str != NULL); /* w_addstr only called from this file */
len = strlen (str);
return w_addmem (buffer, actlen, maxlen, str, len);
}
static int
internal_function
w_addword (wordexp_t *pwordexp, char *word)
{
/* Add a word to the wordlist */
size_t num_p;
char **new_wordv;
/* Internally, NULL acts like "". Convert NULLs to "" before
* the caller sees them.
*/
if (word == NULL)
{
word = __strdup ("");
if (word == NULL)
goto no_space;
}
num_p = 2 + pwordexp->we_wordc + pwordexp->we_offs;
new_wordv = realloc (pwordexp->we_wordv, sizeof (char *) * num_p);
if (new_wordv != NULL)
{
pwordexp->we_wordv = new_wordv;
pwordexp->we_wordv[pwordexp->we_wordc++] = word;
pwordexp->we_wordv[pwordexp->we_wordc] = NULL;
return 0;
}
no_space:
return WRDE_NOSPACE;
}
/* The parse_*() functions should leave *offset being the offset in 'words'
* to the last character processed.
*/
static int
internal_function
parse_backslash (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset)
{
/* We are poised _at_ a backslash, not in quotes */
switch (words[1 + *offset])
{
case 0:
/* Backslash is last character of input words */
return WRDE_SYNTAX;
case '\n':
++(*offset);
break;
default:
*word = w_addchar (*word, word_length, max_length, words[1 + *offset]);
if (*word == NULL)
return WRDE_NOSPACE;
++(*offset);
break;
}
return 0;
}
static int
internal_function
parse_qtd_backslash (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset)
{
/* We are poised _at_ a backslash, inside quotes */
switch (words[1 + *offset])
{
case 0:
/* Backslash is last character of input words */
return WRDE_SYNTAX;
case '\n':
++(*offset);
break;
case '$':
case '`':
case '"':
case '\\':
*word = w_addchar (*word, word_length, max_length, words[1 + *offset]);
if (*word == NULL)
return WRDE_NOSPACE;
++(*offset);
break;
default:
*word = w_addchar (*word, word_length, max_length, words[*offset]);
if (*word != NULL)
*word = w_addchar (*word, word_length, max_length, words[1 + *offset]);
if (*word == NULL)
return WRDE_NOSPACE;
++(*offset);
break;
}
return 0;
}
static int
internal_function
parse_tilde (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, size_t wordc)
{
/* We are poised _at_ a tilde */
size_t i;
if (*word_length != 0)
{
if (!((*word)[*word_length - 1] == '=' && wordc == 0))
{
if (!((*word)[*word_length - 1] == ':'
&& strchr (*word, '=') && wordc == 0))
{
*word = w_addchar (*word, word_length, max_length, '~');
return *word ? 0 : WRDE_NOSPACE;
}
}
}
for (i = 1 + *offset; words[i]; i++)
{
if (words[i] == ':' || words[i] == '/' || words[i] == ' ' ||
words[i] == '\t' || words[i] == 0 )
break;
if (words[i] == '\\')
{
*word = w_addchar (*word, word_length, max_length, '~');
return *word ? 0 : WRDE_NOSPACE;
}
}
if (i == 1 + *offset)
{
/* Tilde appears on its own */
uid_t uid;
struct passwd pwd, *tpwd;
int buflen = 1000;
char* buffer = __alloca (buflen);
int result;
uid = __getuid ();
while ((result = __getpwuid_r (uid, &pwd, buffer, buflen, &tpwd)) != 0
&& errno == ERANGE)
{
buflen += 1000;
buffer = __alloca (buflen);
}
if (result == 0 && pwd.pw_dir != NULL)
{
*word = w_addstr (*word, word_length, max_length, pwd.pw_dir);
if (*word == NULL)
return WRDE_NOSPACE;
}
else
{
*word = w_addchar (*word, word_length, max_length, '~');
if (*word == NULL)
return WRDE_NOSPACE;
}
}
else
{
/* Look up user name in database to get home directory */
char *user = __strndup (&words[1 + *offset], i - *offset);
struct passwd pwd, *tpwd;
int buflen = 1000;
char* buffer = __alloca (buflen);
int result;
while ((result = __getpwnam_r (user, &pwd, buffer, buflen, &tpwd)) != 0
&& errno == ERANGE)
{
buflen += 1000;
buffer = __alloca (buflen);
}
if (result == 0 && pwd.pw_dir)
*word = w_addstr (*word, word_length, max_length, pwd.pw_dir);
else
{
/* (invalid login name) */
*word = w_addchar (*word, word_length, max_length, '~');
if (*word != NULL)
*word = w_addstr (*word, word_length, max_length, user);
}
*offset = i - 1;
}
return *word ? 0 : WRDE_NOSPACE;
}
static int
internal_function
do_parse_glob (const char *glob_word, char **word, size_t *word_length,
size_t *max_length, wordexp_t *pwordexp, const char *ifs,
const char *ifs_white)
{
int error;
int match;
glob_t globbuf;
error = glob (glob_word, GLOB_NOCHECK, NULL, &globbuf);
if (error != 0)
{
/* We can only run into memory problems. */
assert (error == GLOB_NOSPACE);
return WRDE_NOSPACE;
}
if (ifs && !*ifs)
{
/* No field splitting allowed. */
assert (globbuf.gl_pathv[0] != NULL);
*word = w_addstr (*word, word_length, max_length, globbuf.gl_pathv[0]);
for (match = 1; match < globbuf.gl_pathc && *word != NULL; ++match)
{
*word = w_addchar (*word, word_length, max_length, ' ');
if (*word != NULL)
*word = w_addstr (*word, word_length, max_length,
globbuf.gl_pathv[match]);
}
globfree (&globbuf);
return *word ? 0 : WRDE_NOSPACE;
}
assert (ifs == NULL || *ifs != '\0');
if (*word != NULL)
{
free (*word);
*word = w_newword (word_length, max_length);
}
for (match = 0; match < globbuf.gl_pathc; ++match)
{
char *matching_word = __strdup (globbuf.gl_pathv[match]);
if (matching_word == NULL || w_addword (pwordexp, matching_word))
{
globfree (&globbuf);
return WRDE_NOSPACE;
}
}
globfree (&globbuf);
return 0;
}
static int
internal_function
parse_glob (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs, const char *ifs_white)
{
/* We are poised just after a '*', a '[' or a '?'. */
int error = WRDE_NOSPACE;
int quoted = 0; /* 1 if singly-quoted, 2 if doubly */
int i;
wordexp_t glob_list; /* List of words to glob */
glob_list.we_wordc = 0;
glob_list.we_wordv = NULL;
glob_list.we_offs = 0;
for (; words[*offset] != '\0'; ++*offset)
{
if ((ifs && strchr (ifs, words[*offset])) ||
(!ifs && strchr (" \t\n", words[*offset])))
/* Reached IFS */
break;
/* Sort out quoting */
if (words[*offset] == '\'')
{
if (quoted == 0)
{
quoted = 1;
continue;
}
else if (quoted == 1)
{
quoted = 0;
continue;
}
}
else if (words[*offset] == '"')
{
if (quoted == 0)
{
quoted = 2;
continue;
}
else if (quoted == 2)
{
quoted = 0;
continue;
}
}
/* Sort out other special characters */
if (quoted != 1 && words[*offset] == '$')
{
error = parse_dollars (word, word_length, max_length, words,
offset, flags, &glob_list, ifs, ifs_white,
quoted == 2);
if (error)
goto tidy_up;
continue;
}
else if (words[*offset] == '\\')
{
if (quoted)
error = parse_qtd_backslash (word, word_length, max_length,
words, offset);
else
error = parse_backslash (word, word_length, max_length,
words, offset);
if (error)
goto tidy_up;
continue;
}
*word = w_addchar (*word, word_length, max_length, words[*offset]);
if (*word == NULL)
goto tidy_up;
}
/* Don't forget to re-parse the character we stopped at. */
--*offset;
/* Glob the words */
error = w_addword (&glob_list, *word);
*word = w_newword (word_length, max_length);
for (i = 0; error == 0 && i < glob_list.we_wordc; i++)
error = do_parse_glob (glob_list.we_wordv[i], word, word_length,
max_length, pwordexp, ifs, ifs_white);
/* Now tidy up */
tidy_up:
wordfree (&glob_list);
return error;
}
static int
internal_function
parse_squote (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset)
{
/* We are poised just after a single quote */
for (; words[*offset]; ++(*offset))
{
if (words[*offset] != '\'')
{
*word = w_addchar (*word, word_length, max_length, words[*offset]);
if (*word == NULL)
return WRDE_NOSPACE;
}
else return 0;
}
/* Unterminated string */
return WRDE_SYNTAX;
}
/* Functions to evaluate an arithmetic expression */
static int
internal_function
eval_expr_val (char **expr, long int *result)
{
int sgn = +1;
char *digit;
/* Skip white space */
for (digit = *expr; digit && *digit && isspace (*digit); ++digit);
switch (*digit)
{
case '(':
/* Scan for closing paren */
for (++digit; **expr && **expr != ')'; ++(*expr));
/* Is there one? */
if (!**expr)
return WRDE_SYNTAX;
*(*expr)++ = 0;
if (eval_expr (digit, result))
return WRDE_SYNTAX;
return 0;
case '+': /* Positive value */
++digit;
break;
case '-': /* Negative value */
++digit;
sgn = -1;
break;
default:
if (!isdigit (*digit))
return WRDE_SYNTAX;
}
*result = 0;
for (; *digit && isdigit (*digit); ++digit)
*result = (*result * 10) + (*digit - '0');
*expr = digit;
*result *= sgn;
return 0;
}
static int
internal_function
eval_expr_multdiv (char **expr, long int *result)
{
long int arg;
/* Read a Value */
if (eval_expr_val (expr, result) != 0)
return WRDE_SYNTAX;
while (**expr)
{
/* Skip white space */
for (; *expr && **expr && isspace (**expr); ++(*expr));
if (**expr == '*')
{
++(*expr);
if (eval_expr_val (expr, &arg) != 0)
return WRDE_SYNTAX;
*result *= arg;
}
else if (**expr == '/')
{
++(*expr);
if (eval_expr_val (expr, &arg) != 0)
return WRDE_SYNTAX;
*result /= arg;
}
else break;
}
return 0;
}
static int
internal_function
eval_expr (char *expr, long int *result)
{
long int arg;
/* Read a Multdiv */
if (eval_expr_multdiv (&expr, result) != 0)
return WRDE_SYNTAX;
while (*expr)
{
/* Skip white space */
for (; expr && *expr && isspace (*expr); ++expr);
if (*expr == '+')
{
++expr;
if (eval_expr_multdiv (&expr, &arg) != 0)
return WRDE_SYNTAX;
*result += arg;
}
else if (*expr == '-')
{
++expr;
if (eval_expr_multdiv (&expr, &arg) != 0)
return WRDE_SYNTAX;
*result -= arg;
}
else break;
}
return 0;
}
static int
internal_function
parse_arith (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags, int bracket)
{
/* We are poised just after "$((" or "$[" */
int error;
int paren_depth = 1;
size_t expr_length;
size_t expr_maxlen;
char *expr;
expr = w_newword (&expr_length, &expr_maxlen);
for (; words[*offset]; ++(*offset))
{
switch (words[*offset])
{
case '$':
error = parse_dollars (&expr, &expr_length, &expr_maxlen,
words, offset, flags, NULL, NULL, NULL, 1);
/* The ``1'' here is to tell parse_dollars not to
* split the fields.
*/
if (error)
{
free (expr);
return error;
}
break;
case '`':
(*offset)++;
error = parse_backtick (&expr, &expr_length, &expr_maxlen,
words, offset, flags, NULL, NULL, NULL);
/* The first NULL here is to tell parse_backtick not to
* split the fields.
*/
if (error)
{
free (expr);
return error;
}
break;
case '\\':
error = parse_qtd_backslash (&expr, &expr_length, &expr_maxlen,
words, offset);
if (error)
{
free (expr);
return error;
}
/* I think that a backslash within an
* arithmetic expansion is bound to
* cause an error sooner or later anyway though.
*/
break;
case ')':
if (--paren_depth == 0)
{
char result[21]; /* 21 = ceil(log10(2^64)) + 1 */
long int numresult = 0;
long long int convertme;
if (bracket || words[1 + *offset] != ')')
{
free (expr);
return WRDE_SYNTAX;
}
++(*offset);
/* Go - evaluate. */
if (*expr && eval_expr (expr, &numresult) != 0)
{
free (expr);
return WRDE_SYNTAX;
}
if (numresult < 0)
{
convertme = -numresult;
*word = w_addchar (*word, word_length, max_length, '-');
if (!*word)
{
free (expr);
return WRDE_NOSPACE;
}
}
else
convertme = numresult;
result[20] = '\0';
*word = w_addstr (*word, word_length, max_length,
_itoa (convertme, &result[20], 10, 0));
free (expr);
return *word ? 0 : WRDE_NOSPACE;
}
expr = w_addchar (expr, &expr_length, &expr_maxlen, words[*offset]);
if (expr == NULL)
return WRDE_NOSPACE;
break;
case ']':
if (bracket && paren_depth == 1)
{
char result[21]; /* 21 = ceil(log10(2^64)) + 1 */
long int numresult = 0;
/* Go - evaluate. */
if (*expr && eval_expr (expr, &numresult) != 0)
{
free (expr);
return WRDE_SYNTAX;
}
result[20] = '\0';
*word = w_addstr (*word, word_length, max_length,
_itoa_word (numresult, &result[20], 10, 0));
free (expr);
return *word ? 0 : WRDE_NOSPACE;
}
free (expr);
return WRDE_SYNTAX;
case '\n':
case ';':
case '{':
case '}':
free (expr);
return WRDE_BADCHAR;
case '(':
++paren_depth;
default:
expr = w_addchar (expr, &expr_length, &expr_maxlen, words[*offset]);
if (expr == NULL)
return WRDE_NOSPACE;
}
}
/* Premature end */
free (expr);
return WRDE_SYNTAX;
}
/* Function to execute a command and retrieve the results */
/* pwordexp contains NULL if field-splitting is forbidden */
static int
internal_function
exec_comm (char *comm, char **word, size_t *word_length, size_t *max_length,
int flags, wordexp_t *pwordexp, const char *ifs,
const char *ifs_white)
{
int fildes[2];
int bufsize = 128;
int buflen;
int i;
char *buffer;
pid_t pid;
/* Don't fork() unless necessary */
if (!comm || !*comm)
return 0;
if (__pipe (fildes))
/* Bad */
return WRDE_NOSPACE;
if ((pid = __fork ()) < 0)
{
/* Bad */
__close (fildes[0]);
__close (fildes[1]);
return WRDE_NOSPACE;
}
if (pid == 0)
{
/* Child */
const char *args[4] = { _PATH_BSHELL, "-c", comm, NULL };
/* Redirect output. */
__dup2 (fildes[1], 1);
__close (fildes[1]);
/* Redirect stderr to /dev/null if we have to. */
if ((flags & WRDE_SHOWERR) == 0)
{
int fd;
__close (2);
fd = __open (_PATH_DEVNULL, O_WRONLY);
if (fd >= 0 && fd != 2)
{
__dup2 (fd, 2);
__close (fd);
}
}
__close (fildes[0]);
__execve (_PATH_BSHELL, (char *const *) args, __environ);
/* Bad. What now? */
abort ();
}
/* Parent */
__close (fildes[1]);
buffer = __alloca (bufsize);
if (!pwordexp)
{ /* Quoted - no field splitting */
while (1)
{
if ((buflen = __read (fildes[0], buffer, bufsize)) < 1)
{
if (__waitpid (pid, NULL, WNOHANG) == 0)
continue;
if ((buflen = __read (fildes[0], buffer, bufsize)) < 1)
break;
}
*word = w_addmem (*word, word_length, max_length, buffer, buflen);
if (*word == NULL)
goto no_space;
}
}
else
/* Not quoted - split fields */
{
int copying = 0;
/* 'copying' is:
* 0 when searching for first character in a field not IFS white space
* 1 when copying the text of a field
* 2 when searching for possible non-whitespace IFS
*/
while (1)
{
if ((buflen = __read (fildes[0], buffer, bufsize)) < 1)
{
if (__waitpid (pid, NULL, WNOHANG) == 0)
continue;
if ((__read (fildes[0], buffer, bufsize)) < 1)
break;
}
for (i = 0; i < buflen; ++i)
{
if (strchr (ifs, buffer[i]) != NULL)
{
/* Current character is IFS */
if (strchr (ifs_white, buffer[i]) == NULL)
{
/* Current character is IFS but not whitespace */
if (copying == 2)
{
/* current character
* |
* V
* eg: text<space><comma><space>moretext
*
* So, strip whitespace IFS (like at the start)
*/
copying = 0;
continue;
}
copying = 0;
/* fall through and delimit field.. */
}
else
{
/* Current character is IFS white space */
/* If not copying a field, ignore it */
if (copying != 1)
continue;
/* End of field (search for non-ws IFS afterwards) */
copying = 2;
}
/* First IFS white space, or IFS non-whitespace.
* Delimit the field. Nulls are converted by w_addword. */
if (w_addword (pwordexp, *word) == WRDE_NOSPACE)
goto no_space;
*word = w_newword (word_length, max_length);
/* fall back round the loop.. */
}
else
{
/* Not IFS character */
copying = 1;
*word = w_addchar (*word, word_length, max_length,
buffer[i]);
if (*word == NULL)
goto no_space;
}
}
}
}
/* Bash chops off trailing newlines, which seems sensible. */
while (*word_length > 0 && (*word)[*word_length - 1] == '\n')
{
(*word)[--*word_length] = '\0';
/* If the last word was entirely newlines, turn it into a new word
* which can be ignored if there's nothing following it. */
if (*word_length == 0)
{
free (*word);
*word = w_newword (word_length, max_length);
break;
}
}
__close (fildes[0]);
return 0;
no_space:
__kill (pid, SIGKILL);
__waitpid (pid, NULL, 0);
__close (fildes[0]);
return WRDE_NOSPACE;
}
static int
internal_function
parse_comm (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags, wordexp_t *pwordexp,
const char *ifs, const char *ifs_white)
{
/* We are poised just after "$(" */
int paren_depth = 1;
int error = 0;
int quoted = 0; /* 1 for singly-quoted, 2 for doubly-quoted */
size_t comm_length;
size_t comm_maxlen;
char *comm = w_newword (&comm_length, &comm_maxlen);
for (; words[*offset]; ++(*offset))
{
switch (words[*offset])
{
case '\'':
if (quoted == 0)
quoted = 1;
else if (quoted == 1)
quoted = 0;
break;
case '"':
if (quoted == 0)
quoted = 2;
else if (quoted == 2)
quoted = 0;
break;
case ')':
if (!quoted && --paren_depth == 0)
{
/* Go -- give script to the shell */
if (comm)
{
error = exec_comm (comm, word, word_length, max_length,
flags, pwordexp, ifs, ifs_white);
free (comm);
}
return error;
}
/* This is just part of the script */
break;
case '(':
if (!quoted)
++paren_depth;
}
comm = w_addchar (comm, &comm_length, &comm_maxlen, words[*offset]);
if (comm == NULL)
return WRDE_NOSPACE;
}
/* Premature end */
if (comm)
free (comm);
return WRDE_SYNTAX;
}
static int
internal_function
parse_param (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags, wordexp_t *pwordexp,
const char *ifs, const char *ifs_white, int quoted)
{
/* We are poised just after "$" */
enum action
{
ACT_NONE,
ACT_RP_SHORT_LEFT = '#',
ACT_RP_LONG_LEFT = 'L',
ACT_RP_SHORT_RIGHT = '%',
ACT_RP_LONG_RIGHT = 'R',
ACT_NULL_ERROR = '?',
ACT_NULL_SUBST = '-',
ACT_NONNULL_SUBST = '+',
ACT_NULL_ASSIGN = '='
};
size_t env_length;
size_t env_maxlen;
size_t pat_length;
size_t pat_maxlen;
size_t start = *offset;
char *env;
char *pattern;
char *value = NULL;
enum action action = ACT_NONE;
int depth = 0;
int colon_seen = 0;
int seen_hash = 0;
int free_value = 0;
int pattern_is_quoted = 0; /* 1 for singly-quoted, 2 for doubly-quoted */
int error;
int special = 0;
char buffer[21];
int brace = words[*offset] == '{';
env = w_newword (&env_length, &env_maxlen);
pattern = w_newword (&pat_length, &pat_maxlen);
if (brace)
++*offset;
/* First collect the parameter name. */
if (words[*offset] == '#')
{
seen_hash = 1;
if (!brace)
goto envsubst;
++*offset;
}
if (isalpha (words[*offset]) || words[*offset] == '_')
{
/* Normal parameter name. */
do
{
env = w_addchar (env, &env_length, &env_maxlen,
words[*offset]);
if (env == NULL)
goto no_space;
}
while (isalnum (words[++*offset]) || words[*offset] == '_');
}
else if (isdigit (words[*offset]))
{
/* Numeric parameter name. */
special = 1;
do
{
env = w_addchar (env, &env_length, &env_maxlen,
words[*offset]);
if (env == NULL)
goto no_space;
if (!brace)
goto envsubst;
}
while (isdigit(words[++*offset]));
}
else if (strchr ("*@$", words[*offset]) != NULL)
{
/* Special parameter. */
special = 1;
env = w_addchar (env, &env_length, &env_maxlen,
words[*offset]);
if (env == NULL)
goto no_space;
++*offset;
}
else
{
if (brace)
goto syntax;
}
if (brace)
{
/* Check for special action to be applied to the value. */
switch (words[*offset])
{
case '}':
/* Evaluate. */
goto envsubst;
case '#':
action = ACT_RP_SHORT_LEFT;
if (words[1 + *offset] == '#')
{
++*offset;
action = ACT_RP_LONG_LEFT;
}
break;
case '%':
action = ACT_RP_SHORT_RIGHT;
if (words[1 + *offset] == '%')
{
++*offset;
action = ACT_RP_LONG_RIGHT;
}
break;
case ':':
if (strchr ("-=?+", words[1 + *offset]) == NULL)
goto syntax;
colon_seen = 1;
action = words[++*offset];
break;
case '-':
case '=':
case '?':
case '+':
action = words[*offset];
break;
default:
goto syntax;
}
/* Now collect the pattern. */
++*offset;
for (; words[*offset]; ++(*offset))
{
switch (words[*offset])
{
case '{':
if (!pattern_is_quoted)
++depth;
break;
case '}':
if (!pattern_is_quoted)
{
if (depth == 0)
goto envsubst;
--depth;
}
break;
case '\\':
if (!pattern_is_quoted && words[++*offset] == '\0')
goto syntax;
break;
case '\'':
if (pattern_is_quoted == 0)
pattern_is_quoted = 1;
else if (pattern_is_quoted == 1)
pattern_is_quoted = 0;
break;
case '"':
if (pattern_is_quoted == 0)
pattern_is_quoted = 2;
else if (pattern_is_quoted == 2)
pattern_is_quoted = 0;
break;
}
pattern = w_addchar (pattern, &pat_length, &pat_maxlen,
words[*offset]);
if (pattern == NULL)
goto no_space;
}
}
/* End of input string -- remember to reparse the character that we
* stopped at. */
--(*offset);
envsubst:
if (words[start] == '{' && words[*offset] != '}')
goto syntax;
if (env == NULL)
{
if (seen_hash)
{
/* $# expands to the number of positional parameters */
buffer[20] = '\0';
value = _itoa_word (__libc_argc - 1, &buffer[20], 10, 0);
seen_hash = 0;
}
else
{
/* Just $ on its own */
*offset = start - 1;
*word = w_addchar (*word, word_length, max_length, '$');
return *word ? 0 : WRDE_NOSPACE;
}
}
/* Is it a numeric parameter? */
else if (isdigit (env[0]))
{
int n = atoi (env);
if (n >= __libc_argc)
/* Substitute NULL. */
value = NULL;
else
/* Replace with appropriate positional parameter. */
value = __libc_argv[n];
}
/* Is it a special parameter? */
else if (special)
{
/* Is it `$$'? */
if (*env == '$')
{
buffer[20] = '\0';
value = _itoa_word (__getpid (), &buffer[20], 10, 0);
}
/* Is it `${#*}' or `${#@}'? */
else if ((*env == '*' || *env == '@') && seen_hash)
{
buffer[20] = '\0';
value = _itoa_word (__libc_argc > 0 ? __libc_argc - 1 : 0,
&buffer[20], 10, 0);
*word = w_addstr (*word, word_length, max_length, value);
free (env);
if (pattern)
free (pattern);
return *word ? 0 : WRDE_NOSPACE;
}
/* Is it `$*' or `$@' (unquoted) ? */
else if (*env == '*' || (*env == '@' && !quoted))
{
size_t plist_len = 0;
int p;
char *end;
/* Build up value parameter by parameter (copy them) */
for (p = 1; __libc_argv[p]; ++p)
plist_len += strlen (__libc_argv[p]) + 1; /* for space */
value = malloc (plist_len);
if (value == NULL)
goto no_space;
end = value;
*end = 0;
for (p = 1; __libc_argv[p]; ++p)
{
if (p > 1)
*end++ = ' ';
end = __stpcpy (end, __libc_argv[p]);
}
free_value = 1;
}
else
{
/* Must be a quoted `$@' */
assert (*env == '@' && quoted);
/* Each parameter is a separate word ("$@") */
if (__libc_argc == 2)
value = __libc_argv[1];
else if (__libc_argc > 2)
{
int p;
/* Append first parameter to current word. */
value = w_addstr (*word, word_length, max_length,
__libc_argv[1]);
if (value == NULL || w_addword (pwordexp, value))
goto no_space;
for (p = 2; __libc_argv[p + 1]; p++)
{
char *newword = __strdup (__libc_argv[p]);
if (newword == NULL || w_addword (pwordexp, newword))
goto no_space;
}
/* Start a new word with the last parameter. */
*word = w_newword (word_length, max_length);
value = __libc_argv[p];
}
else
{
free (env);
free (pattern);
return 0;
}
}
}
else
value = getenv (env);
if (value == NULL && (flags & WRDE_UNDEF))
{
/* Variable not defined. */
error = WRDE_BADVAL;
goto do_error;
}
if (action != ACT_NONE)
{
switch (action)
{
case ACT_RP_SHORT_LEFT:
case ACT_RP_LONG_LEFT:
case ACT_RP_SHORT_RIGHT:
case ACT_RP_LONG_RIGHT:
{
char *p;
char c;
char *end;
if (value == NULL || pattern == NULL || *pattern == '\0')
break;
end = value + strlen (value);
switch (action)
{
case ACT_RP_SHORT_LEFT:
for (p = value; p <= end; ++p)
{
c = *p;
*p = '\0';
if (fnmatch (pattern, value, 0) != FNM_NOMATCH)
{
*p = c;
if (free_value)
{
char *newval = __strdup (p);
if (newval == NULL)
{
free (value);
goto no_space;
}
free (value);
value = newval;
}
else
value = p;
break;
}
*p = c;
}
break;
case ACT_RP_LONG_LEFT:
for (p = end; p >= value; --p)
{
c = *p;
*p = '\0';
if (fnmatch (pattern, value, 0) != FNM_NOMATCH)
{
*p = c;
if (free_value)
{
char *newval = __strdup (p);
if (newval == NULL)
{
free (value);
goto no_space;
}
free (value);
value = newval;
}
else
value = p;
break;
}
*p = c;
}
break;
case ACT_RP_SHORT_RIGHT:
for (p = end; p >= value; --p)
{
if (fnmatch (pattern, p, 0) != FNM_NOMATCH)
{
char *newval;
newval = malloc (p - value + 1);
if (newval == NULL)
{
if (free_value)
free (value);
goto no_space;
}
*(char *) __mempcpy (newval, value, p - value) = '\0';
if (free_value)
free (value);
value = newval;
free_value = 1;
break;
}
}
break;
case ACT_RP_LONG_RIGHT:
for (p = value; p <= end; ++p)
{
if (fnmatch (pattern, p, 0) != FNM_NOMATCH)
{
char *newval;
newval = malloc (p - value + 1);
if (newval == NULL)
{
if (free_value)
free (value);
goto no_space;
}
*(char *) __mempcpy (newval, value, p - value) = '\0';
if (free_value)
free (value);
value = newval;
free_value = 1;
break;
}
}
break;
default:
break;
}
break;
}
case ACT_NULL_ERROR:
if (value && *value)
/* Substitute parameter */
break;
if (!colon_seen && value)
/* Substitute NULL */
error = 0;
else if (*pattern)
{
/* Expand 'pattern' and write it to stderr */
wordexp_t we;
error = wordexp (pattern, &we, flags);
if (error == 0)
{
int i;
fprintf (stderr, "%s:", env);
for (i = 0; i < we.we_wordc; ++i)
{
fprintf (stderr, " %s", we.we_wordv[i]);
}
fprintf (stderr, "\n");
error = WRDE_BADVAL;
}
wordfree (&we);
}
else
{
fprintf (stderr, "%s: parameter null or not set\n", env);
error = WRDE_BADVAL;
}
if (free_value)
free (value);
goto do_error;
case ACT_NULL_SUBST:
if (value && *value)
/* Substitute parameter */
break;
if (!colon_seen && value)
{
/* Substitute NULL */
if (free_value)
free (value);
goto success;
}
subst_word:
{
/* Substitute word */
wordexp_t we;
int i;
if (free_value)
free (value);
if (quoted)
{
/* No field-splitting is allowed, so imagine
quotes around the word. */
char *qtd_pattern = malloc (3 + strlen (pattern));
if (qtd_pattern)
sprintf (qtd_pattern, "\"%s\"", pattern);
free (pattern);
pattern = qtd_pattern;
}
if (pattern == NULL && (pattern = __strdup ("")) == NULL)
goto no_space;
error = wordexp (pattern, &we, flags);
if (error)
goto do_error;
/* Fingers crossed that the quotes worked.. */
assert (!quoted || we.we_wordc == 1);
/* Substitute */
for (i = 0; i < we.we_wordc; ++i)
if ((error = w_addword (pwordexp, __strdup (we.we_wordv[i])))
!= 0)
break;
if (i < we.we_wordc)
{
/* Ran out of space */
wordfree (&we);
goto do_error;
}
if (action == ACT_NULL_ASSIGN)
{
char *words;
char *cp;
size_t words_size = 0;
if (special)
/* Cannot assign special parameters. */
goto syntax;
for (i = 0; i < we.we_wordc; i++)
words_size += strlen (we.we_wordv[i]) + 1; /* for <space> */
words_size++;
cp = words = __alloca (words_size);
*words = 0;
for (i = 0; i < we.we_wordc - 1; i++)
{
cp = __stpcpy (cp, we.we_wordv[i]);
*cp++ = ' ';
}
strcpy (cp, we.we_wordv[i]);
/* Also assign */
setenv (env, words, 1);
}
wordfree (&we);
goto success;
}
case ACT_NONNULL_SUBST:
if (value && *value)
goto subst_word;
if (!colon_seen && value)
goto subst_word;
/* Substitute NULL */
if (free_value)
free (value);
goto success;
case ACT_NULL_ASSIGN:
if (value && *value)
/* Substitute parameter */
break;
if (!colon_seen && value)
{
/* Substitute NULL */
if (free_value)
free (value);
goto success;
}
/* This checks for '=' so it knows to assign */
goto subst_word;
default:
assert (! "Unrecognised action!");
}
}
free (env); env = NULL;
free (pattern); pattern = NULL;
if (seen_hash)
{
char param_length[21];
param_length[20] = '\0';
*word = w_addstr (*word, word_length, max_length,
_itoa_word (value ? strlen (value) : 0,
&param_length[20], 10, 0));
if (free_value)
{
assert (value != NULL);
free (value);
}
return *word ? 0 : WRDE_NOSPACE;
}
if (value == NULL)
return 0;
if (quoted || !pwordexp)
{
/* Quoted - no field split */
*word = w_addstr (*word, word_length, max_length, value);
if (free_value)
free (value);
return *word ? 0 : WRDE_NOSPACE;
}
else
{
/* Need to field-split */
char *value_copy = __strdup (value); /* Don't modify value */
char *field_begin = value_copy;
int seen_nonws_ifs = 0;
if (free_value)
free (value);
if (value_copy == NULL)
goto no_space;
do
{
char *field_end = field_begin;
char *next_field;
/* If this isn't the first field, start a new word */
if (field_begin != value_copy)
{
if (w_addword (pwordexp, *word) == WRDE_NOSPACE)
{
free (value_copy);
goto no_space;
}
*word = w_newword (word_length, max_length);
}
/* Skip IFS whitespace before the field */
field_begin += strspn (field_begin, ifs_white);
if (!seen_nonws_ifs && *field_begin == 0)
/* Nothing but whitespace */
break;
/* Search for the end of the field */
field_end = field_begin + strcspn (field_begin, ifs);
/* Set up pointer to the character after end of field and
skip whitespace IFS after it. */
next_field = field_end + strspn (field_end, ifs_white);
/* Skip at most one non-whitespace IFS character after the field */
seen_nonws_ifs = 0;
if (*next_field && strchr (ifs, *next_field))
{
seen_nonws_ifs = 1;
next_field++;
}
/* Null-terminate it */
*field_end = 0;
/* Tag a copy onto the current word */
*word = w_addstr (*word, word_length, max_length, field_begin);
if (*word == NULL && *field_begin != '\0')
{
free (value_copy);
goto no_space;
}
field_begin = next_field;
}
while (seen_nonws_ifs || *field_begin);
free (value_copy);
}
return 0;
success:
error = 0;
goto do_error;
no_space:
error = WRDE_NOSPACE;
goto do_error;
syntax:
error = WRDE_SYNTAX;
do_error:
if (env)
free (env);
if (pattern)
free (pattern);
return error;
}
static int
internal_function
parse_dollars (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs, const char *ifs_white,
int quoted)
{
/* We are poised _at_ "$" */
switch (words[1 + *offset])
{
case '"':
case '\'':
case 0:
*word = w_addchar (*word, word_length, max_length, '$');
return *word ? 0 : WRDE_NOSPACE;
case '(':
if (words[2 + *offset] == '(')
{
/* Differentiate between $((1+3)) and $((echo);(ls)) */
int i = 3 + *offset;
int depth = 0;
while (words[i] && !(depth == 0 && words[i] == ')'))
{
if (words[i] == '(')
++depth;
else if (words[i] == ')')
--depth;
++i;
}
if (words[i] == ')' && words[i + 1] == ')')
{
(*offset) += 3;
/* Call parse_arith -- 0 is for "no brackets" */
return parse_arith (word, word_length, max_length, words, offset,
flags, 0);
}
}
if (flags & WRDE_NOCMD)
return WRDE_CMDSUB;
(*offset) += 2;
return parse_comm (word, word_length, max_length, words, offset, flags,
quoted? NULL : pwordexp, ifs, ifs_white);
case '[':
(*offset) += 2;
/* Call parse_arith -- 1 is for "brackets" */
return parse_arith (word, word_length, max_length, words, offset, flags,
1);
case '{':
default:
++(*offset); /* parse_param needs to know if "{" is there */
return parse_param (word, word_length, max_length, words, offset, flags,
pwordexp, ifs, ifs_white, quoted);
}
}
static int
parse_backtick (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs, const char *ifs_white)
{
/* We are poised just after "`" */
int error;
int squoting = 0;
size_t comm_length;
size_t comm_maxlen;
char *comm = w_newword (&comm_length, &comm_maxlen);
for (; words[*offset]; ++(*offset))
{
switch (words[*offset])
{
case '`':
/* Go -- give the script to the shell */
error = exec_comm (comm, word, word_length, max_length, flags,
pwordexp, ifs, ifs_white);
free (comm);
return error;
case '\\':
if (squoting)
{
error = parse_qtd_backslash (&comm, &comm_length, &comm_maxlen,
words, offset);
if (error)
{
free (comm);
return error;
}
break;
}
++(*offset);
error = parse_backslash (&comm, &comm_length, &comm_maxlen, words,
offset);
if (error)
{
free (comm);
return error;
}
break;
case '\'':
squoting = 1 - squoting;
default:
comm = w_addchar (comm, &comm_length, &comm_maxlen, words[*offset]);
if (comm == NULL)
return WRDE_NOSPACE;
}
}
/* Premature end */
free (comm);
return WRDE_SYNTAX;
}
static int
internal_function
parse_dquote (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char * ifs, const char * ifs_white)
{
/* We are poised just after a double-quote */
int error;
for (; words[*offset]; ++(*offset))
{
switch (words[*offset])
{
case '"':
return 0;
case '$':
error = parse_dollars (word, word_length, max_length, words, offset,
flags, pwordexp, ifs, ifs_white, 1);
/* The ``1'' here is to tell parse_dollars not to
* split the fields. It may need to, however ("$@").
*/
if (error)
return error;
break;
case '`':
if (flags & WRDE_NOCMD)
return WRDE_CMDSUB;
++(*offset);
error = parse_backtick (word, word_length, max_length, words,
offset, flags, NULL, NULL, NULL);
/* The first NULL here is to tell parse_backtick not to
* split the fields.
*/
if (error)
return error;
break;
case '\\':
error = parse_qtd_backslash (word, word_length, max_length, words,
offset);
if (error)
return error;
break;
default:
*word = w_addchar (*word, word_length, max_length, words[*offset]);
if (*word == NULL)
return WRDE_NOSPACE;
}
}
/* Unterminated string */
return WRDE_SYNTAX;
}
/*
* wordfree() is to be called after pwordexp is finished with.
*/
void
wordfree (wordexp_t *pwordexp)
{
/* wordexp can set pwordexp to NULL */
if (pwordexp && pwordexp->we_wordv)
{
char **wordv = pwordexp->we_wordv;
for (wordv += pwordexp->we_offs; *wordv; ++wordv)
free (*wordv);
free (pwordexp->we_wordv);
pwordexp->we_wordv = NULL;
}
}
/*
* wordexp()
*/
int
wordexp (const char *words, wordexp_t *pwordexp, int flags)
{
size_t wordv_offset;
size_t words_offset;
size_t word_length;
size_t max_length;
char *word = w_newword (&word_length, &max_length);
int error;
char *ifs;
char ifs_white[4];
char **old_wordv = pwordexp->we_wordv;
size_t old_wordc = (flags & WRDE_REUSE) ? pwordexp->we_wordc : 0;
if (flags & WRDE_REUSE)
{
/* Minimal implementation of WRDE_REUSE for now */
wordfree (pwordexp);
old_wordv = NULL;
}
if (flags & WRDE_DOOFFS)
{
pwordexp->we_wordv = calloc (1 + pwordexp->we_offs, sizeof (char *));
if (pwordexp->we_wordv == NULL)
{
error = WRDE_NOSPACE;
goto do_error;
}
}
else
{
pwordexp->we_wordv = calloc (1, sizeof (char *));
if (pwordexp->we_wordv == NULL)
{
error = WRDE_NOSPACE;
goto do_error;
}
pwordexp->we_offs = 0;
}
if ((flags & WRDE_APPEND) == 0)
pwordexp->we_wordc = 0;
wordv_offset = pwordexp->we_offs + pwordexp->we_wordc;
/* Find out what the field separators are.
* There are two types: whitespace and non-whitespace.
*/
ifs = getenv ("IFS");
if (!ifs)
/* IFS unset - use <space><tab><newline>. */
ifs = strcpy (ifs_white, " \t\n");
else
{
char *ifsch = ifs;
char *whch = ifs_white;
/* Start off with no whitespace IFS characters */
ifs_white[0] = '\0';
while (*ifsch != '\0')
{
if ((*ifsch == ' ') || (*ifsch == '\t') || (*ifsch == '\n'))
{
/* Whitespace IFS. See first whether it is already in our
collection. */
char *runp = ifs_white;
while (runp < whch && *runp != '\0' && *runp != *ifsch)
++runp;
if (runp == whch)
*whch++ = *ifsch;
}
++ifsch;
}
*whch = '\0';
}
for (words_offset = 0 ; words[words_offset] ; ++words_offset)
switch (words[words_offset])
{
case '\\':
error = parse_backslash (&word, &word_length, &max_length, words,
&words_offset);
if (error)
goto do_error;
break;
case '$':
error = parse_dollars (&word, &word_length, &max_length, words,
&words_offset, flags, pwordexp, ifs, ifs_white,
0);
if (error)
goto do_error;
break;
case '`':
if (flags & WRDE_NOCMD)
{
error = WRDE_CMDSUB;
goto do_error;
}
++words_offset;
error = parse_backtick (&word, &word_length, &max_length, words,
&words_offset, flags, pwordexp, ifs,
ifs_white);
if (error)
goto do_error;
break;
case '"':
++words_offset;
error = parse_dquote (&word, &word_length, &max_length, words,
&words_offset, flags, pwordexp, ifs, ifs_white);
if (error)
goto do_error;
break;
case '\'':
++words_offset;
error = parse_squote (&word, &word_length, &max_length, words,
&words_offset);
if (error)
goto do_error;
break;
case '~':
error = parse_tilde (&word, &word_length, &max_length, words,
&words_offset, pwordexp->we_wordc);
if (error)
goto do_error;
break;
case '*':
case '[':
case '?':
error = parse_glob (&word, &word_length, &max_length, words,
&words_offset, flags, pwordexp, ifs, ifs_white);
if (error)
goto do_error;
break;
default:
/* Is it a word separator? */
if (strchr (" \t", words[words_offset]) == NULL)
{
char ch = words[words_offset];
/* Not a word separator -- but is it a valid word char? */
if (strchr ("\n|&;<>(){}", ch))
{
/* Fail */
wordfree (pwordexp);
pwordexp->we_wordc = 0;
pwordexp->we_wordv = old_wordv;
return WRDE_BADCHAR;
}
/* "Ordinary" character -- add it to word */
/* Convert IFS chars to blanks -- bash does this */
if (strchr (ifs, ch))
ch = ' ';
word = w_addchar (word, &word_length, &max_length,
ch);
if (word == NULL)
{
error = WRDE_NOSPACE;
goto do_error;
}
break;
}
/* If a word has been delimited, add it to the list. */
if (word != NULL)
{
error = w_addword (pwordexp, word);
if (error)
goto do_error;
}
word = w_newword (&word_length, &max_length);
}
/* End of string */
/* There was a word separator at the end */
if (word == NULL) /* i.e. w_newword */
return 0;
/* There was no field separator at the end */
return w_addword (pwordexp, word);
do_error:
/* Error:
* free memory used (unless error is WRDE_NOSPACE), and
* set we_wordc and wd_wordv back to what they were.
*/
if (word != NULL)
free (word);
if (error == WRDE_NOSPACE)
return WRDE_NOSPACE;
wordfree (pwordexp);
pwordexp->we_wordv = old_wordv;
pwordexp->we_wordc = old_wordc;
return error;
}