1998-09-16 00:47  Tim Waugh  <tim@cyberelk.demon.co.uk>

	* posix/wordexp-test.c: If expansion or substitution occurs
	anywhere in a word, the entire word is subject to field-splitting.

	* posix/wordexp.c (parse_glob): Look for end of word instead of
	end of field when deciding what to glob.
	(field_split_word): New function, now the only place where
	field-splitting is performed.
	(parse_dollars): New parameter - tell the caller if
	field-splitting should be performed on this word.

	* posix/wordexp-test.c (testit): Only call wordfree if wordexp
	succeeded (or failed with WRDE_NOSPACE).

1998-09-15 19:53  Tim Waugh  <tim@cyberelk.demon.co.uk>

	* posix/wordexp.c (wordexp): Don't convert IFS characters to
	blanks.

	* posix/wordexp-test.c: Words not the result of expansion or
	substitution should remain unchanged.
This commit is contained in:
Ulrich Drepper 1998-09-15 21:24:37 +00:00
parent aa2bc6a32d
commit a8125d8552
3 changed files with 181 additions and 200 deletions

View File

@ -1,3 +1,26 @@
1998-09-16 00:47 Tim Waugh <tim@cyberelk.demon.co.uk>
* posix/wordexp-test.c: If expansion or substitution occurs
anywhere in a word, the entire word is subject to field-splitting.
* posix/wordexp.c (parse_glob): Look for end of word instead of
end of field when deciding what to glob.
(field_split_word): New function, now the only place where
field-splitting is performed.
(parse_dollars): New parameter - tell the caller if
field-splitting should be performed on this word.
* posix/wordexp-test.c (testit): Only call wordfree if wordexp
succeeded (or failed with WRDE_NOSPACE).
1998-09-15 19:53 Tim Waugh <tim@cyberelk.demon.co.uk>
* posix/wordexp.c (wordexp): Don't convert IFS characters to
blanks.
* posix/wordexp-test.c: Words not the result of expansion or
substitution should remain unchanged.
1998-09-15 Ulrich Drepper <drepper@cygnus.com> 1998-09-15 Ulrich Drepper <drepper@cygnus.com>
* elf/dynamic-link.h [!ELF_MACHINE_PLTREL_OVERLAP] * elf/dynamic-link.h [!ELF_MACHINE_PLTREL_OVERLAP]

View File

@ -43,7 +43,7 @@ struct test_case_struct
{ 0, NULL, "one two", 0, 2, { "one", "two", }, IFS }, { 0, NULL, "one two", 0, 2, { "one", "two", }, IFS },
{ 0, NULL, "one two three", 0, 3, { "one", "two", "three", }, IFS }, { 0, NULL, "one two three", 0, 3, { "one", "two", "three", }, IFS },
{ 0, NULL, " \tfoo\t\tbar ", 0, 2, { "foo", "bar", }, IFS }, { 0, NULL, " \tfoo\t\tbar ", 0, 2, { "foo", "bar", }, IFS },
{ 0, NULL, "red , white blue", 0, 4, { "red", " ", "white", "blue", }, " ," }, { 0, NULL, "red , white blue", 0, 4, { "red", ",", "white", "blue", }, " ," },
{ 0, NULL, "one two three", 0, 3, { "one", "two", "three", }, "" }, { 0, NULL, "one two three", 0, 3, { "one", "two", "three", }, "" },
{ 0, NULL, "one \"two three\"", 0, 2, { "one", "two three", }, IFS }, { 0, NULL, "one \"two three\"", 0, 2, { "one", "two three", }, IFS },
{ 0, NULL, "one \"two three\"", 0, 2, { "one", "two three", }, "" }, { 0, NULL, "one \"two three\"", 0, 2, { "one", "two three", }, "" },
@ -60,10 +60,11 @@ struct test_case_struct
{ 0, NULL, "$(echo :abc:\\ )", 0, 2, { "", "abc", }, ": " }, { 0, NULL, "$(echo :abc:\\ )", 0, 2, { "", "abc", }, ": " },
{ 0, NULL, "$(echo :abc\\ )", 0, 2, { "", "abc", }, ": " }, { 0, NULL, "$(echo :abc\\ )", 0, 2, { "", "abc", }, ": " },
{ 0, ":abc:", "$(echo $var)", 0, 2, { "", "abc", }, ":" }, { 0, ":abc:", "$(echo $var)", 0, 2, { "", "abc", }, ":" },
{ 0, NULL, ":abc:", 0, 1, { " abc ", }, ":" }, { 0, NULL, ":abc:", 0, 1, { ":abc:", }, ":" },
{ 0, NULL, "$(echo :abc:)def", 0, 3, { "", "abc", "def", }, ":" }, { 0, NULL, "$(echo :abc:)def", 0, 3, { "", "abc", "def", }, ":" },
{ 0, NULL, "$(echo abc:de)f", 0, 2, { "abc", "def", }, ":" }, { 0, NULL, "$(echo abc:de)f", 0, 2, { "abc", "def", }, ":" },
{ 0, NULL, "$(echo abc:de)f:ghi", 0, 2, { "abc", "def ghi", }, ":" }, { 0, NULL, "$(echo abc:de)f:ghi", 0, 3, { "abc", "def", "ghi", }, ":" },
{ 0, NULL, "abc:d$(echo ef:ghi)", 0, 3, { "abc", "def", "ghi", }, ":" },
{ 0, "abc:", "$var$(echo def:ghi)", 0, 3, { "abc", "def", "ghi", }, ":" }, { 0, "abc:", "$var$(echo def:ghi)", 0, 3, { "abc", "def", "ghi", }, ":" },
{ 0, "abc:d", "$var$(echo ef:ghi)", 0, 3, { "abc", "def", "ghi", }, ":" }, { 0, "abc:d", "$var$(echo ef:ghi)", 0, 3, { "abc", "def", "ghi", }, ":" },
{ 0, "def:ghi", "$(echo abc:)$var", 0, 3, { "abc", "def", "ghi", }, ":" }, { 0, "def:ghi", "$(echo abc:)$var", 0, 3, { "abc", "def", "ghi", }, ":" },
@ -308,6 +309,7 @@ testit (struct test_case_struct *tc)
else else
printf ("OK\n"); printf ("OK\n");
if (retval == 0 || retval == WRDE_NOSPACE)
wordfree (&we); wordfree (&we);
return bzzzt; return bzzzt;

View File

@ -56,7 +56,7 @@ extern char **__libc_argv;
static int parse_dollars (char **word, size_t *word_length, size_t *max_length, static int parse_dollars (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags, const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs, wordexp_t *pwordexp, const char *ifs,
const char *ifs_white, int quoted) const char *ifs_white, int quoted, int *fsplit)
internal_function; internal_function;
static int parse_backtick (char **word, size_t *word_length, static int parse_backtick (char **word, size_t *word_length,
size_t *max_length, const char *words, size_t *max_length, const char *words,
@ -183,6 +183,78 @@ no_space:
return WRDE_NOSPACE; return WRDE_NOSPACE;
} }
/* Split WORD into fields using the separator set IFS and append each
   field to PWORDEXP.

   WORD       - NUL-terminated string to split.  It is modified in place:
                a NUL byte is written at the end of every field found.
                A null pointer is accepted and yields no fields.
   PWORDEXP   - word list that receives the fields (via w_addword).
   IFS        - all field-separator characters.
   IFS_WHITE  - the separator characters that are skipped in runs around
                a field (presumably the whitespace members of IFS --
                confirm against the caller that builds it).

   Returns 0 on success, or WRDE_NOSPACE if w_addword or w_addstr reports
   failure.  WORD itself is never freed here.  */
static int
internal_function
field_split_word (char *word, wordexp_t *pwordexp, const char *ifs,
const char *ifs_white)
{
size_t field_length;
size_t field_maxlen;
/* FIELD accumulates the text of the field currently being built.  */
char *field = w_newword (&field_length, &field_maxlen);
char *field_begin = word;
/* Non-zero when the previous field was terminated by an IFS character
   that is not in IFS_WHITE; in that case one more (possibly empty)
   iteration is required even if nothing but whitespace follows.  */
int seen_nonws_ifs = 0;
if (!word)
return 0;
do
{
char *field_end = field_begin;
char *next_field;
/* If this isn't the first field, start a new word */
if (field_begin != word)
{
/* Flush the field completed by the previous iteration.
   NOTE(review): FIELD may be a null pointer here when that field was
   empty; w_addword is assumed to cope with that -- confirm.  */
if (w_addword (pwordexp, field) == WRDE_NOSPACE)
goto no_space;
field = w_newword (&field_length, &field_maxlen);
}
/* Skip IFS whitespace before the field */
field_begin += strspn (field_begin, ifs_white);
if (!seen_nonws_ifs && *field_begin == 0)
/* Nothing but whitespace */
break;
/* Search for the end of the field */
field_end = field_begin + strcspn (field_begin, ifs);
/* Set up pointer to the character after end of field and
skip whitespace IFS after it. */
next_field = field_end + strspn (field_end, ifs_white);
/* Skip at most one non-whitespace IFS character after the field */
seen_nonws_ifs = 0;
if (*next_field && strchr (ifs, *next_field))
{
seen_nonws_ifs = 1;
next_field++;
}
/* Null-terminate it.  This must happen after NEXT_FIELD has been
   computed, because it overwrites the first separator character.  */
*field_end = 0;
/* Tag a copy onto the current word */
field = w_addstr (field, &field_length, &field_maxlen, field_begin);
/* A null result is only treated as an error when there was text to
   copy; for an empty field it is tolerated.  */
if (field == NULL && *field_begin != '\0')
goto no_space;
field_begin = next_field;
}
while (seen_nonws_ifs || *field_begin);
/* Add the last field, if any text was accumulated for it.  */
if (field && w_addword (pwordexp, field))
goto no_space;
return 0;
no_space:
return WRDE_NOSPACE;
}
/* The parse_*() functions should leave *offset being the offset in 'words' /* The parse_*() functions should leave *offset being the offset in 'words'
* to the last character processed. * to the last character processed.
*/ */
@ -424,15 +496,15 @@ parse_glob (char **word, size_t *word_length, size_t *max_length,
int quoted = 0; /* 1 if singly-quoted, 2 if doubly */ int quoted = 0; /* 1 if singly-quoted, 2 if doubly */
int i; int i;
wordexp_t glob_list; /* List of words to glob */ wordexp_t glob_list; /* List of words to glob */
int fieldsplit = 0;
glob_list.we_wordc = 0; glob_list.we_wordc = 0;
glob_list.we_wordv = NULL; glob_list.we_wordv = NULL;
glob_list.we_offs = 0; glob_list.we_offs = 0;
for (; words[*offset] != '\0'; ++*offset) for (; words[*offset] != '\0'; ++*offset)
{ {
if ((ifs && strchr (ifs, words[*offset])) || if (strchr (" \t\n", words[*offset]))
(!ifs && strchr (" \t\n", words[*offset]))) /* Reached end of word */
/* Reached IFS */
break; break;
/* Sort out quoting */ /* Sort out quoting */
@ -468,7 +540,7 @@ parse_glob (char **word, size_t *word_length, size_t *max_length,
{ {
error = parse_dollars (word, word_length, max_length, words, error = parse_dollars (word, word_length, max_length, words,
offset, flags, &glob_list, ifs, ifs_white, offset, flags, &glob_list, ifs, ifs_white,
quoted == 2); quoted == 2, &fieldsplit);
if (error) if (error)
goto tidy_up; goto tidy_up;
@ -497,8 +569,16 @@ parse_glob (char **word, size_t *word_length, size_t *max_length,
/* Don't forget to re-parse the character we stopped at. */ /* Don't forget to re-parse the character we stopped at. */
--*offset; --*offset;
/* Glob the words */ if (fieldsplit)
{
error = field_split_word (*word, &glob_list, ifs, ifs_white);
if (*word)
free (*word);
}
else
error = w_addword (&glob_list, *word); error = w_addword (&glob_list, *word);
/* Glob the words */
*word = w_newword (word_length, max_length); *word = w_newword (word_length, max_length);
for (i = 0; error == 0 && i < glob_list.we_wordc; i++) for (i = 0; error == 0 && i < glob_list.we_wordc; i++)
error = do_parse_glob (glob_list.we_wordv[i], word, word_length, error = do_parse_glob (glob_list.we_wordv[i], word, word_length,
@ -676,7 +756,8 @@ parse_arith (char **word, size_t *word_length, size_t *max_length,
{ {
case '$': case '$':
error = parse_dollars (&expr, &expr_length, &expr_maxlen, error = parse_dollars (&expr, &expr_length, &expr_maxlen,
words, offset, flags, NULL, NULL, NULL, 1); words, offset, flags, NULL, NULL, NULL, 1,
NULL);
/* The ``1'' here is to tell parse_dollars not to /* The ``1'' here is to tell parse_dollars not to
* split the fields. * split the fields.
*/ */
@ -871,9 +952,7 @@ exec_comm (char *comm, char **word, size_t *word_length, size_t *max_length,
__close (fildes[1]); __close (fildes[1]);
buffer = __alloca (bufsize); buffer = __alloca (bufsize);
if (!pwordexp) /* Read fildes[0] and put it into a word. */
{ /* Quoted - no field splitting */
while (1) while (1)
{ {
if ((buflen = __read (fildes[0], buffer, bufsize)) < 1) if ((buflen = __read (fildes[0], buffer, bufsize)) < 1)
@ -888,84 +967,6 @@ exec_comm (char *comm, char **word, size_t *word_length, size_t *max_length,
if (*word == NULL) if (*word == NULL)
goto no_space; goto no_space;
} }
}
else
/* Not quoted - split fields */
{
int copying = 0;
/* 'copying' is:
* 0 when searching for first character in a field not IFS white space
* 1 when copying the text of a field
* 2 when searching for possible non-whitespace IFS
*/
while (1)
{
if ((buflen = __read (fildes[0], buffer, bufsize)) < 1)
{
if (__waitpid (pid, NULL, WNOHANG) == 0)
continue;
if ((__read (fildes[0], buffer, bufsize)) < 1)
break;
}
for (i = 0; i < buflen; ++i)
{
if (strchr (ifs, buffer[i]) != NULL)
{
/* Current character is IFS */
if (strchr (ifs_white, buffer[i]) == NULL)
{
/* Current character is IFS but not whitespace */
if (copying == 2)
{
/* current character
* |
* V
* eg: text<space><comma><space>moretext
*
* So, strip whitespace IFS (like at the start)
*/
copying = 0;
continue;
}
copying = 0;
/* fall through and delimit field.. */
}
else
{
/* Current character is IFS white space */
/* If not copying a field, ignore it */
if (copying != 1)
continue;
/* End of field (search for non-ws IFS afterwards) */
copying = 2;
}
/* First IFS white space, or IFS non-whitespace.
* Delimit the field. Nulls are converted by w_addword. */
if (w_addword (pwordexp, *word) == WRDE_NOSPACE)
goto no_space;
*word = w_newword (word_length, max_length);
/* fall back round the loop.. */
}
else
{
/* Not IFS character */
copying = 1;
*word = w_addchar (*word, word_length, max_length,
buffer[i]);
if (*word == NULL)
goto no_space;
}
}
}
}
/* Bash chops off trailing newlines, which seems sensible. */ /* Bash chops off trailing newlines, which seems sensible. */
while (*word_length > 0 && (*word)[*word_length - 1] == '\n') while (*word_length > 0 && (*word)[*word_length - 1] == '\n')
@ -1701,87 +1702,11 @@ envsubst:
if (value == NULL) if (value == NULL)
return 0; return 0;
if (quoted || !pwordexp)
{
/* Quoted - no field split */
*word = w_addstr (*word, word_length, max_length, value); *word = w_addstr (*word, word_length, max_length, value);
if (free_value) if (free_value)
free (value); free (value);
return *word ? 0 : WRDE_NOSPACE; return *word ? 0 : WRDE_NOSPACE;
}
else
{
/* Need to field-split */
char *value_copy = __strdup (value); /* Don't modify value */
char *field_begin = value_copy;
int seen_nonws_ifs = 0;
if (free_value)
free (value);
if (value_copy == NULL)
goto no_space;
do
{
char *field_end = field_begin;
char *next_field;
/* If this isn't the first field, start a new word */
if (field_begin != value_copy)
{
if (w_addword (pwordexp, *word) == WRDE_NOSPACE)
{
free (value_copy);
goto no_space;
}
*word = w_newword (word_length, max_length);
}
/* Skip IFS whitespace before the field */
field_begin += strspn (field_begin, ifs_white);
if (!seen_nonws_ifs && *field_begin == 0)
/* Nothing but whitespace */
break;
/* Search for the end of the field */
field_end = field_begin + strcspn (field_begin, ifs);
/* Set up pointer to the character after end of field and
skip whitespace IFS after it. */
next_field = field_end + strspn (field_end, ifs_white);
/* Skip at most one non-whitespace IFS character after the field */
seen_nonws_ifs = 0;
if (*next_field && strchr (ifs, *next_field))
{
seen_nonws_ifs = 1;
next_field++;
}
/* Null-terminate it */
*field_end = 0;
/* Tag a copy onto the current word */
*word = w_addstr (*word, word_length, max_length, field_begin);
if (*word == NULL && *field_begin != '\0')
{
free (value_copy);
goto no_space;
}
field_begin = next_field;
}
while (seen_nonws_ifs || *field_begin);
free (value_copy);
}
return 0;
success: success:
error = 0; error = 0;
@ -1809,7 +1734,7 @@ internal_function
parse_dollars (char **word, size_t *word_length, size_t *max_length, parse_dollars (char **word, size_t *word_length, size_t *max_length,
const char *words, size_t *offset, int flags, const char *words, size_t *offset, int flags,
wordexp_t *pwordexp, const char *ifs, const char *ifs_white, wordexp_t *pwordexp, const char *ifs, const char *ifs_white,
int quoted) int quoted, int *fsplit)
{ {
/* We are poised _at_ "$" */ /* We are poised _at_ "$" */
switch (words[1 + *offset]) switch (words[1 + *offset])
@ -1839,6 +1764,12 @@ parse_dollars (char **word, size_t *word_length, size_t *max_length,
if (words[i] == ')' && words[i + 1] == ')') if (words[i] == ')' && words[i + 1] == ')')
{ {
(*offset) += 3; (*offset) += 3;
/* This word is subject to field-splitting as long as
* it isn't quoted. */
if (fsplit)
*fsplit = !quoted;
/* Call parse_arith -- 0 is for "no brackets" */ /* Call parse_arith -- 0 is for "no brackets" */
return parse_arith (word, word_length, max_length, words, offset, return parse_arith (word, word_length, max_length, words, offset,
flags, 0); flags, 0);
@ -1849,11 +1780,23 @@ parse_dollars (char **word, size_t *word_length, size_t *max_length,
return WRDE_CMDSUB; return WRDE_CMDSUB;
(*offset) += 2; (*offset) += 2;
/* This word is subject to field-splitting as long as
* it isn't quoted. */
if (fsplit)
*fsplit = !quoted;
return parse_comm (word, word_length, max_length, words, offset, flags, return parse_comm (word, word_length, max_length, words, offset, flags,
quoted? NULL : pwordexp, ifs, ifs_white); quoted? NULL : pwordexp, ifs, ifs_white);
case '[': case '[':
(*offset) += 2; (*offset) += 2;
/* This word is subject to field-splitting as long as
* it isn't quoted. */
if (fsplit)
*fsplit = !quoted;
/* Call parse_arith -- 1 is for "brackets" */ /* Call parse_arith -- 1 is for "brackets" */
return parse_arith (word, word_length, max_length, words, offset, flags, return parse_arith (word, word_length, max_length, words, offset, flags,
1); 1);
@ -1861,6 +1804,12 @@ parse_dollars (char **word, size_t *word_length, size_t *max_length,
case '{': case '{':
default: default:
++(*offset); /* parse_param needs to know if "{" is there */ ++(*offset); /* parse_param needs to know if "{" is there */
/* This word is subject to field-splitting as long as
* it isn't quoted. */
if (fsplit)
*fsplit = !quoted;
return parse_param (word, word_length, max_length, words, offset, flags, return parse_param (word, word_length, max_length, words, offset, flags,
pwordexp, ifs, ifs_white, quoted); pwordexp, ifs, ifs_white, quoted);
} }
@ -1948,7 +1897,7 @@ parse_dquote (char **word, size_t *word_length, size_t *max_length,
case '$': case '$':
error = parse_dollars (word, word_length, max_length, words, offset, error = parse_dollars (word, word_length, max_length, words, offset,
flags, pwordexp, ifs, ifs_white, 1); flags, pwordexp, ifs, ifs_white, 1, NULL);
/* The ``1'' here is to tell parse_dollars not to /* The ``1'' here is to tell parse_dollars not to
* split the fields. It may need to, however ("$@"). * split the fields. It may need to, however ("$@").
*/ */
@ -2030,6 +1979,7 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
char ifs_white[4]; char ifs_white[4];
char **old_wordv = pwordexp->we_wordv; char **old_wordv = pwordexp->we_wordv;
size_t old_wordc = (flags & WRDE_REUSE) ? pwordexp->we_wordc : 0; size_t old_wordc = (flags & WRDE_REUSE) ? pwordexp->we_wordc : 0;
int fieldsplit_this_word = 0;
if (flags & WRDE_REUSE) if (flags & WRDE_REUSE)
{ {
@ -2100,7 +2050,8 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
*whch = '\0'; *whch = '\0';
} }
for (words_offset = 0 ; words[words_offset] ; ++words_offset) fieldsplit_this_word = 0;
for (words_offset = 0 ; ; ++words_offset)
switch (words[words_offset]) switch (words[words_offset])
{ {
case '\\': case '\\':
@ -2115,7 +2066,7 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
case '$': case '$':
error = parse_dollars (&word, &word_length, &max_length, words, error = parse_dollars (&word, &word_length, &max_length, words,
&words_offset, flags, pwordexp, ifs, ifs_white, &words_offset, flags, pwordexp, ifs, ifs_white,
0); 0, &fieldsplit_this_word);
if (error) if (error)
goto do_error; goto do_error;
@ -2137,6 +2088,8 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
if (error) if (error)
goto do_error; goto do_error;
fieldsplit_this_word = 1;
break; break;
case '"': case '"':
@ -2181,7 +2134,8 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
default: default:
/* Is it a word separator? */ /* Is it a word separator? */
if (strchr (" \t", words[words_offset]) == NULL) if (words[words_offset] != '\0' &&
strchr (" \t", words[words_offset]) == NULL)
{ {
char ch = words[words_offset]; char ch = words[words_offset];
@ -2196,11 +2150,6 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
} }
/* "Ordinary" character -- add it to word */ /* "Ordinary" character -- add it to word */
/* Convert IFS chars to blanks -- bash does this */
if (strchr (ifs, ch))
ch = ' ';
word = w_addchar (word, &word_length, &max_length, word = w_addchar (word, &word_length, &max_length,
ch); ch);
if (word == NULL) if (word == NULL)
@ -2215,23 +2164,30 @@ wordexp (const char *words, wordexp_t *pwordexp, int flags)
/* If a word has been delimited, add it to the list. */ /* If a word has been delimited, add it to the list. */
if (word != NULL) if (word != NULL)
{ {
if (fieldsplit_this_word)
{
error = field_split_word (word, pwordexp, ifs, ifs_white);
free (word);
}
else
error = w_addword (pwordexp, word); error = w_addword (pwordexp, word);
if (error) if (error)
goto do_error; goto do_error;
} }
fieldsplit_this_word = 0;
if (words[words_offset] == '\0')
/* End of string. */
goto end_of_string;
word = w_newword (&word_length, &max_length); word = w_newword (&word_length, &max_length);
} }
/* End of string */ end_of_string:
/* There was a word separator at the end */
if (word == NULL) /* i.e. w_newword */
return 0; return 0;
/* There was no field separator at the end */
return w_addword (pwordexp, word);
do_error: do_error:
/* Error: /* Error:
* free memory used (unless error is WRDE_NOSPACE), and * free memory used (unless error is WRDE_NOSPACE), and