1 /* POSIX.2 wordexp implementation.
2 Copyright (C) 1997-2002, 2003, 2005 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Tim Waugh <tim@cyberelk.demon.co.uk>.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, write to the Free
18 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
34 #include <sys/param.h>
37 #include <sys/types.h>
38 #include <sys/types.h>
46 #include <bits/libc-lock.h>
47 #include <stdio-common/_itoa.h>
49 /* Undefine the following line for the production version. */
50 /* #define NDEBUG 1 */
53 /* Get some device information. */
54 #include <device-nrs.h>
57 * This is a recursive-descent-style word expansion routine.
60 /* These variables are defined and initialized in the startup code. */
61 extern int __libc_argc attribute_hidden
;
62 extern char **__libc_argv attribute_hidden
;
64 /* Some forward declarations */
65 static int parse_dollars (char **word
, size_t *word_length
, size_t *max_length
,
66 const char *words
, size_t *offset
, int flags
,
67 wordexp_t
*pwordexp
, const char *ifs
,
68 const char *ifs_white
, int quoted
)
70 static int parse_backtick (char **word
, size_t *word_length
,
71 size_t *max_length
, const char *words
,
72 size_t *offset
, int flags
, wordexp_t
*pwordexp
,
73 const char *ifs
, const char *ifs_white
)
75 static int parse_dquote (char **word
, size_t *word_length
, size_t *max_length
,
76 const char *words
, size_t *offset
, int flags
,
77 wordexp_t
*pwordexp
, const char *ifs
,
78 const char *ifs_white
)
80 static int eval_expr (char *expr
, long int *result
) internal_function
;
82 /* The w_*() functions manipulate word lists. */
86 /* Result of w_newword will be ignored if it's the last word. */
88 w_newword (size_t *actlen
, size_t *maxlen
)
90 *actlen
= *maxlen
= 0;
95 w_addchar (char *buffer
, size_t *actlen
, size_t *maxlen
, char ch
)
96 /* (lengths exclude trailing zero) */
98 /* Add a character to the buffer, allocating room for it if needed. */
100 if (*actlen
== *maxlen
)
102 char *old_buffer
= buffer
;
103 assert (buffer
== NULL
|| *maxlen
!= 0);
105 buffer
= (char *) realloc (buffer
, 1 + *maxlen
);
113 buffer
[*actlen
] = ch
;
114 buffer
[++(*actlen
)] = '\0';
122 w_addmem (char *buffer
, size_t *actlen
, size_t *maxlen
, const char *str
,
125 /* Add a string to the buffer, allocating room for it if needed.
127 if (*actlen
+ len
> *maxlen
)
129 char *old_buffer
= buffer
;
130 assert (buffer
== NULL
|| *maxlen
!= 0);
131 *maxlen
+= MAX (2 * len
, W_CHUNK
);
132 buffer
= realloc (old_buffer
, 1 + *maxlen
);
140 *((char *) __mempcpy (&buffer
[*actlen
], str
, len
)) = '\0';
149 w_addstr (char *buffer
, size_t *actlen
, size_t *maxlen
, const char *str
)
150 /* (lengths exclude trailing zero) */
152 /* Add a string to the buffer, allocating room for it if needed.
156 assert (str
!= NULL
); /* w_addstr only called from this file */
159 return w_addmem (buffer
, actlen
, maxlen
, str
, len
);
164 w_addword (wordexp_t
*pwordexp
, char *word
)
166 /* Add a word to the wordlist */
170 /* Internally, NULL acts like "". Convert NULLs to "" before
171 * the caller sees them.
175 word
= __strdup ("");
180 num_p
= 2 + pwordexp
->we_wordc
+ pwordexp
->we_offs
;
181 new_wordv
= realloc (pwordexp
->we_wordv
, sizeof (char *) * num_p
);
182 if (new_wordv
!= NULL
)
184 pwordexp
->we_wordv
= new_wordv
;
185 pwordexp
->we_wordv
[pwordexp
->we_offs
+ pwordexp
->we_wordc
++] = word
;
186 pwordexp
->we_wordv
[pwordexp
->we_offs
+ pwordexp
->we_wordc
] = NULL
;
194 /* The parse_*() functions should leave *offset being the offset in 'words'
195 * to the last character processed.
200 parse_backslash (char **word
, size_t *word_length
, size_t *max_length
,
201 const char *words
, size_t *offset
)
203 /* We are poised _at_ a backslash, not in quotes */
205 switch (words
[1 + *offset
])
208 /* Backslash is last character of input words */
216 *word
= w_addchar (*word
, word_length
, max_length
, words
[1 + *offset
]);
229 parse_qtd_backslash (char **word
, size_t *word_length
, size_t *max_length
,
230 const char *words
, size_t *offset
)
232 /* We are poised _at_ a backslash, inside quotes */
234 switch (words
[1 + *offset
])
237 /* Backslash is last character of input words */
248 *word
= w_addchar (*word
, word_length
, max_length
, words
[1 + *offset
]);
256 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
258 *word
= w_addchar (*word
, word_length
, max_length
, words
[1 + *offset
]);
272 parse_tilde (char **word
, size_t *word_length
, size_t *max_length
,
273 const char *words
, size_t *offset
, size_t wordc
)
275 /* We are poised _at_ a tilde */
278 if (*word_length
!= 0)
280 if (!((*word
)[*word_length
- 1] == '=' && wordc
== 0))
282 if (!((*word
)[*word_length
- 1] == ':'
283 && strchr (*word
, '=') && wordc
== 0))
285 *word
= w_addchar (*word
, word_length
, max_length
, '~');
286 return *word
? 0 : WRDE_NOSPACE
;
291 for (i
= 1 + *offset
; words
[i
]; i
++)
293 if (words
[i
] == ':' || words
[i
] == '/' || words
[i
] == ' ' ||
294 words
[i
] == '\t' || words
[i
] == 0 )
297 if (words
[i
] == '\\')
299 *word
= w_addchar (*word
, word_length
, max_length
, '~');
300 return *word
? 0 : WRDE_NOSPACE
;
304 if (i
== 1 + *offset
)
306 /* Tilde appears on its own */
308 struct passwd pwd
, *tpwd
;
314 /* POSIX.2 says ~ expands to $HOME and if HOME is unset the
315 results are unspecified. We do a lookup on the uid if
318 home
= getenv ("HOME");
321 *word
= w_addstr (*word
, word_length
, max_length
, home
);
328 buffer
= __alloca (buflen
);
330 while ((result
= __getpwuid_r (uid
, &pwd
, buffer
, buflen
, &tpwd
)) != 0
332 buffer
= extend_alloca (buffer
, buflen
, buflen
+ 1000);
334 if (result
== 0 && tpwd
!= NULL
&& pwd
.pw_dir
!= NULL
)
336 *word
= w_addstr (*word
, word_length
, max_length
, pwd
.pw_dir
);
342 *word
= w_addchar (*word
, word_length
, max_length
, '~');
350 /* Look up user name in database to get home directory */
351 char *user
= strndupa (&words
[1 + *offset
], i
- (1 + *offset
));
352 struct passwd pwd
, *tpwd
;
354 char* buffer
= __alloca (buflen
);
357 while ((result
= __getpwnam_r (user
, &pwd
, buffer
, buflen
, &tpwd
)) != 0
359 buffer
= extend_alloca (buffer
, buflen
, buflen
+ 1000);
361 if (result
== 0 && tpwd
!= NULL
&& pwd
.pw_dir
)
362 *word
= w_addstr (*word
, word_length
, max_length
, pwd
.pw_dir
);
365 /* (invalid login name) */
366 *word
= w_addchar (*word
, word_length
, max_length
, '~');
368 *word
= w_addstr (*word
, word_length
, max_length
, user
);
373 return *word
? 0 : WRDE_NOSPACE
;
379 do_parse_glob (const char *glob_word
, char **word
, size_t *word_length
,
380 size_t *max_length
, wordexp_t
*pwordexp
, const char *ifs
,
381 const char *ifs_white
)
387 error
= glob (glob_word
, GLOB_NOCHECK
, NULL
, &globbuf
);
391 /* We can only run into memory problems. */
392 assert (error
== GLOB_NOSPACE
);
398 /* No field splitting allowed. */
399 assert (globbuf
.gl_pathv
[0] != NULL
);
400 *word
= w_addstr (*word
, word_length
, max_length
, globbuf
.gl_pathv
[0]);
401 for (match
= 1; match
< globbuf
.gl_pathc
&& *word
!= NULL
; ++match
)
403 *word
= w_addchar (*word
, word_length
, max_length
, ' ');
405 *word
= w_addstr (*word
, word_length
, max_length
,
406 globbuf
.gl_pathv
[match
]);
410 return *word
? 0 : WRDE_NOSPACE
;
413 assert (ifs
== NULL
|| *ifs
!= '\0');
417 *word
= w_newword (word_length
, max_length
);
420 for (match
= 0; match
< globbuf
.gl_pathc
; ++match
)
422 char *matching_word
= __strdup (globbuf
.gl_pathv
[match
]);
423 if (matching_word
== NULL
|| w_addword (pwordexp
, matching_word
))
436 parse_glob (char **word
, size_t *word_length
, size_t *max_length
,
437 const char *words
, size_t *offset
, int flags
,
438 wordexp_t
*pwordexp
, const char *ifs
, const char *ifs_white
)
440 /* We are poised just after a '*', a '[' or a '?'. */
441 int error
= WRDE_NOSPACE
;
442 int quoted
= 0; /* 1 if singly-quoted, 2 if doubly */
444 wordexp_t glob_list
; /* List of words to glob */
446 glob_list
.we_wordc
= 0;
447 glob_list
.we_wordv
= NULL
;
448 glob_list
.we_offs
= 0;
449 for (; words
[*offset
] != '\0'; ++*offset
)
451 if ((ifs
&& strchr (ifs
, words
[*offset
])) ||
452 (!ifs
&& strchr (" \t\n", words
[*offset
])))
456 /* Sort out quoting */
457 if (words
[*offset
] == '\'')
464 else if (quoted
== 1)
470 else if (words
[*offset
] == '"')
477 else if (quoted
== 2)
484 /* Sort out other special characters */
485 if (quoted
!= 1 && words
[*offset
] == '$')
487 error
= parse_dollars (word
, word_length
, max_length
, words
,
488 offset
, flags
, &glob_list
, ifs
, ifs_white
,
495 else if (words
[*offset
] == '\\')
498 error
= parse_qtd_backslash (word
, word_length
, max_length
,
501 error
= parse_backslash (word
, word_length
, max_length
,
510 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
515 /* Don't forget to re-parse the character we stopped at. */
519 error
= w_addword (&glob_list
, *word
);
520 *word
= w_newword (word_length
, max_length
);
521 for (i
= 0; error
== 0 && i
< glob_list
.we_wordc
; i
++)
522 error
= do_parse_glob (glob_list
.we_wordv
[i
], word
, word_length
,
523 max_length
, pwordexp
, ifs
, ifs_white
);
527 wordfree (&glob_list
);
533 parse_squote (char **word
, size_t *word_length
, size_t *max_length
,
534 const char *words
, size_t *offset
)
536 /* We are poised just after a single quote */
537 for (; words
[*offset
]; ++(*offset
))
539 if (words
[*offset
] != '\'')
541 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
548 /* Unterminated string */
552 /* Functions to evaluate an arithmetic expression */
555 eval_expr_val (char **expr
, long int *result
)
559 /* Skip white space */
560 for (digit
= *expr
; digit
&& *digit
&& isspace (*digit
); ++digit
);
564 /* Scan for closing paren */
565 for (++digit
; **expr
&& **expr
!= ')'; ++(*expr
));
573 if (eval_expr (digit
, result
))
579 /* POSIX requires that decimal, octal, and hexadecimal constants are
580 recognized. Therefore we pass 0 as the third parameter to strtol. */
581 *result
= strtol (digit
, expr
, 0);
590 eval_expr_multdiv (char **expr
, long int *result
)
595 if (eval_expr_val (expr
, result
) != 0)
600 /* Skip white space */
601 for (; *expr
&& **expr
&& isspace (**expr
); ++(*expr
));
606 if (eval_expr_val (expr
, &arg
) != 0)
611 else if (**expr
== '/')
614 if (eval_expr_val (expr
, &arg
) != 0)
627 eval_expr (char *expr
, long int *result
)
632 if (eval_expr_multdiv (&expr
, result
) != 0)
637 /* Skip white space */
638 for (; expr
&& *expr
&& isspace (*expr
); ++expr
);
643 if (eval_expr_multdiv (&expr
, &arg
) != 0)
648 else if (*expr
== '-')
651 if (eval_expr_multdiv (&expr
, &arg
) != 0)
664 parse_arith (char **word
, size_t *word_length
, size_t *max_length
,
665 const char *words
, size_t *offset
, int flags
, int bracket
)
667 /* We are poised just after "$((" or "$[" */
674 expr
= w_newword (&expr_length
, &expr_maxlen
);
675 for (; words
[*offset
]; ++(*offset
))
677 switch (words
[*offset
])
680 error
= parse_dollars (&expr
, &expr_length
, &expr_maxlen
,
681 words
, offset
, flags
, NULL
, NULL
, NULL
, 1);
682 /* The ``1'' here is to tell parse_dollars not to
694 error
= parse_backtick (&expr
, &expr_length
, &expr_maxlen
,
695 words
, offset
, flags
, NULL
, NULL
, NULL
);
696 /* The first NULL here is to tell parse_backtick not to
707 error
= parse_qtd_backslash (&expr
, &expr_length
, &expr_maxlen
,
714 /* I think that a backslash within an
715 * arithmetic expansion is bound to
716 * cause an error sooner or later anyway though.
721 if (--paren_depth
== 0)
723 char result
[21]; /* 21 = ceil(log10(2^64)) + 1 */
724 long int numresult
= 0;
725 long long int convertme
;
727 if (bracket
|| words
[1 + *offset
] != ')')
736 if (*expr
&& eval_expr (expr
, &numresult
) != 0)
744 convertme
= -numresult
;
745 *word
= w_addchar (*word
, word_length
, max_length
, '-');
753 convertme
= numresult
;
756 *word
= w_addstr (*word
, word_length
, max_length
,
757 _itoa (convertme
, &result
[20], 10, 0));
759 return *word
? 0 : WRDE_NOSPACE
;
761 expr
= w_addchar (expr
, &expr_length
, &expr_maxlen
, words
[*offset
]);
768 if (bracket
&& paren_depth
== 1)
770 char result
[21]; /* 21 = ceil(log10(2^64)) + 1 */
771 long int numresult
= 0;
774 if (*expr
&& eval_expr (expr
, &numresult
) != 0)
781 *word
= w_addstr (*word
, word_length
, max_length
,
782 _itoa_word (numresult
, &result
[20], 10, 0));
784 return *word
? 0 : WRDE_NOSPACE
;
800 expr
= w_addchar (expr
, &expr_length
, &expr_maxlen
, words
[*offset
]);
811 /* Function called by child process in exec_comm() */
813 internal_function
__attribute__ ((always_inline
))
814 exec_comm_child (char *comm
, int *fildes
, int showerr
, int noexec
)
816 const char *args
[4] = { _PATH_BSHELL
, "-c", comm
, NULL
};
818 /* Execute the command, or just check syntax? */
822 /* Redirect output. */
823 __dup2 (fildes
[1], STDOUT_FILENO
);
826 /* Redirect stderr to /dev/null if we have to. */
832 fd
= __open (_PATH_DEVNULL
, O_WRONLY
);
833 if (fd
>= 0 && fd
!= 2)
835 __dup2 (fd
, STDERR_FILENO
);
838 /* Be paranoid. Check that we actually opened the /dev/null
840 if (__builtin_expect (__fxstat64 (_STAT_VER
, STDERR_FILENO
, &st
), 0) != 0
841 || __builtin_expect (S_ISCHR (st
.st_mode
), 1) == 0
842 #if defined DEV_NULL_MAJOR && defined DEV_NULL_MINOR
843 || st
.st_rdev
!= makedev (DEV_NULL_MAJOR
, DEV_NULL_MINOR
)
846 /* It's not the /dev/null device. Stop right here. The
847 problem is: how do we stop? We use _exit() with an
848 hopefully unusual exit code. */
852 /* Make sure the subshell doesn't field-split on our behalf. */
856 __execve (_PATH_BSHELL
, (char *const *) args
, __environ
);
862 /* Function to execute a command and retrieve the results */
863 /* pwordexp contains NULL if field-splitting is forbidden */
866 exec_comm (char *comm
, char **word
, size_t *word_length
, size_t *max_length
,
867 int flags
, wordexp_t
*pwordexp
, const char *ifs
,
868 const char *ifs_white
)
875 size_t maxnewlines
= 0;
876 char buffer
[bufsize
];
880 /* Don't fork() unless necessary */
889 if ((pid
= __fork ()) < 0)
900 exec_comm_child (comm
, fildes
, noexec
? 0 : flags
& WRDE_SHOWERR
, noexec
);
904 /* If we are just testing the syntax, only wait. */
906 return (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
, 0)) == pid
907 && status
!= 0) ? WRDE_SYNTAX
: 0;
913 /* Quoted - no field splitting */
917 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
920 if (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
, WNOHANG
)) == 0)
922 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
927 maxnewlines
+= buflen
;
929 *word
= w_addmem (*word
, word_length
, max_length
, buffer
, buflen
);
935 /* Not quoted - split fields */
939 * 0 when searching for first character in a field not IFS white space
940 * 1 when copying the text of a field
941 * 2 when searching for possible non-whitespace IFS
942 * 3 when searching for non-newline after copying field
947 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
950 if (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
, WNOHANG
)) == 0)
952 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
957 for (i
= 0; i
< buflen
; ++i
)
959 if (strchr (ifs
, buffer
[i
]) != NULL
)
961 /* Current character is IFS */
962 if (strchr (ifs_white
, buffer
[i
]) == NULL
)
964 /* Current character is IFS but not whitespace */
970 * eg: text<space><comma><space>moretext
972 * So, strip whitespace IFS (like at the start)
979 /* fall through and delimit field.. */
983 if (buffer
[i
] == '\n')
985 /* Current character is (IFS) newline */
987 /* If copying a field, this is the end of it,
988 but maybe all that's left is trailing newlines.
989 So start searching for a non-newline. */
997 /* Current character is IFS white space, but
1000 /* If not either copying a field or searching
1001 for non-newline after a field, ignore it */
1002 if (copying
!= 1 && copying
!= 3)
1005 /* End of field (search for non-ws IFS afterwards) */
1010 /* First IFS white space (non-newline), or IFS non-whitespace.
1011 * Delimit the field. Nulls are converted by w_addword. */
1012 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1015 *word
= w_newword (word_length
, max_length
);
1018 /* fall back round the loop.. */
1022 /* Not IFS character */
1026 /* Nothing but (IFS) newlines since the last field,
1027 so delimit it here before starting new word */
1028 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1031 *word
= w_newword (word_length
, max_length
);
1036 if (buffer
[i
] == '\n') /* happens if newline not in IFS */
1041 *word
= w_addchar (*word
, word_length
, max_length
,
1050 /* Chop off trailing newlines (required by POSIX.2) */
1051 /* Ensure we don't go back further than the beginning of the
1052 substitution (i.e. remove maxnewlines bytes at most) */
1053 while (maxnewlines
-- != 0 &&
1054 *word_length
> 0 && (*word
)[*word_length
- 1] == '\n')
1056 (*word
)[--*word_length
] = '\0';
1058 /* If the last word was entirely newlines, turn it into a new word
1059 * which can be ignored if there's nothing following it. */
1060 if (*word_length
== 0)
1063 *word
= w_newword (word_length
, max_length
);
1068 __close (fildes
[0]);
1071 /* Check for syntax error (re-execute but with "-n" flag) */
1072 if (buflen
< 1 && status
!= 0)
1081 __kill (pid
, SIGKILL
);
1082 TEMP_FAILURE_RETRY (__waitpid (pid
, NULL
, 0));
1083 __close (fildes
[0]);
1084 return WRDE_NOSPACE
;
1089 parse_comm (char **word
, size_t *word_length
, size_t *max_length
,
1090 const char *words
, size_t *offset
, int flags
, wordexp_t
*pwordexp
,
1091 const char *ifs
, const char *ifs_white
)
1093 /* We are poised just after "$(" */
1094 int paren_depth
= 1;
1096 int quoted
= 0; /* 1 for singly-quoted, 2 for doubly-quoted */
1099 char *comm
= w_newword (&comm_length
, &comm_maxlen
);
1101 for (; words
[*offset
]; ++(*offset
))
1103 switch (words
[*offset
])
1108 else if (quoted
== 1)
1116 else if (quoted
== 2)
1122 if (!quoted
&& --paren_depth
== 0)
1124 /* Go -- give script to the shell */
1127 #ifdef __libc_ptf_call
1128 /* We do not want the exec_comm call to be cut short
1129 by a thread cancellation since cleanup is very
1130 ugly. Therefore disable cancellation for
1132 // XXX Ideally we do want the thread being cancelable.
1133 // XXX If demand is there we'll change it.
1134 int state
= PTHREAD_CANCEL_ENABLE
;
1135 __libc_ptf_call (pthread_setcancelstate
,
1136 (PTHREAD_CANCEL_DISABLE
, &state
), 0);
1139 error
= exec_comm (comm
, word
, word_length
, max_length
,
1140 flags
, pwordexp
, ifs
, ifs_white
);
1142 #ifdef __libc_ptf_call
1143 __libc_ptf_call (pthread_setcancelstate
, (state
, NULL
), 0);
1152 /* This is just part of the script */
1160 comm
= w_addchar (comm
, &comm_length
, &comm_maxlen
, words
[*offset
]);
1162 return WRDE_NOSPACE
;
1174 parse_param (char **word
, size_t *word_length
, size_t *max_length
,
1175 const char *words
, size_t *offset
, int flags
, wordexp_t
*pwordexp
,
1176 const char *ifs
, const char *ifs_white
, int quoted
)
1178 /* We are poised just after "$" */
1182 ACT_RP_SHORT_LEFT
= '#',
1183 ACT_RP_LONG_LEFT
= 'L',
1184 ACT_RP_SHORT_RIGHT
= '%',
1185 ACT_RP_LONG_RIGHT
= 'R',
1186 ACT_NULL_ERROR
= '?',
1187 ACT_NULL_SUBST
= '-',
1188 ACT_NONNULL_SUBST
= '+',
1189 ACT_NULL_ASSIGN
= '='
1195 size_t start
= *offset
;
1199 enum action action
= ACT_NONE
;
1204 int pattern_is_quoted
= 0; /* 1 for singly-quoted, 2 for doubly-quoted */
1208 int brace
= words
[*offset
] == '{';
1210 env
= w_newword (&env_length
, &env_maxlen
);
1211 pattern
= w_newword (&pat_length
, &pat_maxlen
);
1216 /* First collect the parameter name. */
1218 if (words
[*offset
] == '#')
1226 if (isalpha (words
[*offset
]) || words
[*offset
] == '_')
1228 /* Normal parameter name. */
1231 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1236 while (isalnum (words
[++*offset
]) || words
[*offset
] == '_');
1238 else if (isdigit (words
[*offset
]))
1240 /* Numeric parameter name. */
1244 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1251 while (isdigit(words
[++*offset
]));
1253 else if (strchr ("*@$", words
[*offset
]) != NULL
)
1255 /* Special parameter. */
1257 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1271 /* Check for special action to be applied to the value. */
1272 switch (words
[*offset
])
1279 action
= ACT_RP_SHORT_LEFT
;
1280 if (words
[1 + *offset
] == '#')
1283 action
= ACT_RP_LONG_LEFT
;
1288 action
= ACT_RP_SHORT_RIGHT
;
1289 if (words
[1 + *offset
] == '%')
1292 action
= ACT_RP_LONG_RIGHT
;
1297 if (strchr ("-=?+", words
[1 + *offset
]) == NULL
)
1301 action
= words
[++*offset
];
1308 action
= words
[*offset
];
1315 /* Now collect the pattern, but don't expand it yet. */
1317 for (; words
[*offset
]; ++(*offset
))
1319 switch (words
[*offset
])
1322 if (!pattern_is_quoted
)
1327 if (!pattern_is_quoted
)
1336 if (pattern_is_quoted
)
1337 /* Quoted; treat as normal character. */
1340 /* Otherwise, it's an escape: next character is literal. */
1341 if (words
[++*offset
] == '\0')
1344 pattern
= w_addchar (pattern
, &pat_length
, &pat_maxlen
, '\\');
1345 if (pattern
== NULL
)
1351 if (pattern_is_quoted
== 0)
1352 pattern_is_quoted
= 1;
1353 else if (pattern_is_quoted
== 1)
1354 pattern_is_quoted
= 0;
1359 if (pattern_is_quoted
== 0)
1360 pattern_is_quoted
= 2;
1361 else if (pattern_is_quoted
== 2)
1362 pattern_is_quoted
= 0;
1367 pattern
= w_addchar (pattern
, &pat_length
, &pat_maxlen
,
1369 if (pattern
== NULL
)
1374 /* End of input string -- remember to reparse the character that we
1379 if (words
[start
] == '{' && words
[*offset
] != '}')
1386 /* $# expands to the number of positional parameters */
1388 value
= _itoa_word (__libc_argc
- 1, &buffer
[20], 10, 0);
1393 /* Just $ on its own */
1394 *offset
= start
- 1;
1395 *word
= w_addchar (*word
, word_length
, max_length
, '$');
1396 return *word
? 0 : WRDE_NOSPACE
;
1399 /* Is it a numeric parameter? */
1400 else if (isdigit (env
[0]))
1404 if (n
>= __libc_argc
)
1405 /* Substitute NULL. */
1408 /* Replace with appropriate positional parameter. */
1409 value
= __libc_argv
[n
];
1411 /* Is it a special parameter? */
1418 value
= _itoa_word (__getpid (), &buffer
[20], 10, 0);
1420 /* Is it `${#*}' or `${#@}'? */
1421 else if ((*env
== '*' || *env
== '@') && seen_hash
)
1424 value
= _itoa_word (__libc_argc
> 0 ? __libc_argc
- 1 : 0,
1425 &buffer
[20], 10, 0);
1426 *word
= w_addstr (*word
, word_length
, max_length
, value
);
1430 return *word
? 0 : WRDE_NOSPACE
;
1432 /* Is it `$*' or `$@' (unquoted) ? */
1433 else if (*env
== '*' || (*env
== '@' && !quoted
))
1435 size_t plist_len
= 0;
1439 /* Build up value parameter by parameter (copy them) */
1440 for (p
= 1; __libc_argv
[p
]; ++p
)
1441 plist_len
+= strlen (__libc_argv
[p
]) + 1; /* for space */
1442 value
= malloc (plist_len
);
1447 for (p
= 1; __libc_argv
[p
]; ++p
)
1451 end
= __stpcpy (end
, __libc_argv
[p
]);
1458 /* Must be a quoted `$@' */
1459 assert (*env
== '@' && quoted
);
1461 /* Each parameter is a separate word ("$@") */
1462 if (__libc_argc
== 2)
1463 value
= __libc_argv
[1];
1464 else if (__libc_argc
> 2)
1468 /* Append first parameter to current word. */
1469 value
= w_addstr (*word
, word_length
, max_length
,
1471 if (value
== NULL
|| w_addword (pwordexp
, value
))
1474 for (p
= 2; __libc_argv
[p
+ 1]; p
++)
1476 char *newword
= __strdup (__libc_argv
[p
]);
1477 if (newword
== NULL
|| w_addword (pwordexp
, newword
))
1481 /* Start a new word with the last parameter. */
1482 *word
= w_newword (word_length
, max_length
);
1483 value
= __libc_argv
[p
];
1494 value
= getenv (env
);
1496 if (value
== NULL
&& (flags
& WRDE_UNDEF
))
1498 /* Variable not defined. */
1499 error
= WRDE_BADVAL
;
1503 if (action
!= ACT_NONE
)
1505 int expand_pattern
= 0;
1507 /* First, find out if we need to expand pattern (i.e. if we will
1511 case ACT_RP_SHORT_LEFT
:
1512 case ACT_RP_LONG_LEFT
:
1513 case ACT_RP_SHORT_RIGHT
:
1514 case ACT_RP_LONG_RIGHT
:
1515 /* Always expand for these. */
1519 case ACT_NULL_ERROR
:
1520 case ACT_NULL_SUBST
:
1521 case ACT_NULL_ASSIGN
:
1522 if (!value
|| (!*value
&& colon_seen
))
1523 /* If param is unset, or set but null and a colon has been seen,
1524 the expansion of the pattern will be needed. */
1529 case ACT_NONNULL_SUBST
:
1530 /* Expansion of word will be needed if parameter is set and not null,
1531 or set null but no colon has been seen. */
1532 if (value
&& (*value
|| !colon_seen
))
1538 assert (! "Unrecognised action!");
1543 /* We need to perform tilde expansion, parameter expansion,
1544 command substitution, and arithmetic expansion. We also
1545 have to be a bit careful with wildcard characters, as
1546 pattern might be given to fnmatch soon. To do this, we
1547 convert quotes to escapes. */
1553 int quoted
= 0; /* 1: single quotes; 2: double */
1555 expanded
= w_newword (&exp_len
, &exp_maxl
);
1556 for (p
= pattern
; p
&& *p
; p
++)
1565 else if (quoted
== 0)
1574 else if (quoted
== 0)
1584 /* Convert quoted wildchar to escaped wildchar. */
1585 expanded
= w_addchar (expanded
, &exp_len
,
1588 if (expanded
== NULL
)
1595 error
= parse_dollars (&expanded
, &exp_len
, &exp_maxl
, p
,
1596 &offset
, flags
, NULL
, NULL
, NULL
, 1);
1612 if (quoted
|| exp_len
)
1616 error
= parse_tilde (&expanded
, &exp_len
, &exp_maxl
, p
,
1633 expanded
= w_addchar (expanded
, &exp_len
, &exp_maxl
, '\\');
1635 assert (*p
); /* checked when extracted initially */
1636 if (expanded
== NULL
)
1640 expanded
= w_addchar (expanded
, &exp_len
, &exp_maxl
, *p
);
1642 if (expanded
== NULL
)
1654 case ACT_RP_SHORT_LEFT
:
1655 case ACT_RP_LONG_LEFT
:
1656 case ACT_RP_SHORT_RIGHT
:
1657 case ACT_RP_LONG_RIGHT
:
1663 if (value
== NULL
|| pattern
== NULL
|| *pattern
== '\0')
1666 end
= value
+ strlen (value
);
1670 case ACT_RP_SHORT_LEFT
:
1671 for (p
= value
; p
<= end
; ++p
)
1675 if (fnmatch (pattern
, value
, 0) != FNM_NOMATCH
)
1680 char *newval
= __strdup (p
);
1698 case ACT_RP_LONG_LEFT
:
1699 for (p
= end
; p
>= value
; --p
)
1703 if (fnmatch (pattern
, value
, 0) != FNM_NOMATCH
)
1708 char *newval
= __strdup (p
);
1726 case ACT_RP_SHORT_RIGHT
:
1727 for (p
= end
; p
>= value
; --p
)
1729 if (fnmatch (pattern
, p
, 0) != FNM_NOMATCH
)
1732 newval
= malloc (p
- value
+ 1);
1741 *(char *) __mempcpy (newval
, value
, p
- value
) = '\0';
1752 case ACT_RP_LONG_RIGHT
:
1753 for (p
= value
; p
<= end
; ++p
)
1755 if (fnmatch (pattern
, p
, 0) != FNM_NOMATCH
)
1758 newval
= malloc (p
- value
+ 1);
1767 *(char *) __mempcpy (newval
, value
, p
- value
) = '\0';
1785 case ACT_NULL_ERROR
:
1786 if (value
&& *value
)
1787 /* Substitute parameter */
1791 if (!colon_seen
&& value
)
1792 /* Substitute NULL */
1796 const char *str
= pattern
;
1799 str
= _("parameter null or not set");
1801 __fxprintf (NULL
, "%s: %s\n", env
, str
);
1808 case ACT_NULL_SUBST
:
1809 if (value
&& *value
)
1810 /* Substitute parameter */
1813 if (free_value
&& value
)
1816 if (!colon_seen
&& value
)
1817 /* Substitute NULL */
1820 value
= pattern
? __strdup (pattern
) : pattern
;
1823 if (pattern
&& !value
)
1828 case ACT_NONNULL_SUBST
:
1829 if (value
&& (*value
|| !colon_seen
))
1831 if (free_value
&& value
)
1834 value
= pattern
? __strdup (pattern
) : pattern
;
1837 if (pattern
&& !value
)
1843 /* Substitute NULL */
1848 case ACT_NULL_ASSIGN
:
1849 if (value
&& *value
)
1850 /* Substitute parameter */
1853 if (!colon_seen
&& value
)
1855 /* Substitute NULL */
1861 if (free_value
&& value
)
1864 value
= pattern
? __strdup (pattern
) : pattern
;
1867 if (pattern
&& !value
)
1870 __setenv (env
, value
, 1);
1874 assert (! "Unrecognised action!");
1878 free (env
); env
= NULL
;
1879 free (pattern
); pattern
= NULL
;
1883 char param_length
[21];
1884 param_length
[20] = '\0';
1885 *word
= w_addstr (*word
, word_length
, max_length
,
1886 _itoa_word (value
? strlen (value
) : 0,
1887 ¶m_length
[20], 10, 0));
1890 assert (value
!= NULL
);
1894 return *word
? 0 : WRDE_NOSPACE
;
1900 if (quoted
|| !pwordexp
)
1902 /* Quoted - no field split */
1903 *word
= w_addstr (*word
, word_length
, max_length
, value
);
1907 return *word
? 0 : WRDE_NOSPACE
;
1911 /* Need to field-split */
1912 char *value_copy
= __strdup (value
); /* Don't modify value */
1913 char *field_begin
= value_copy
;
1914 int seen_nonws_ifs
= 0;
1919 if (value_copy
== NULL
)
1924 char *field_end
= field_begin
;
1927 /* If this isn't the first field, start a new word */
1928 if (field_begin
!= value_copy
)
1930 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1936 *word
= w_newword (word_length
, max_length
);
1939 /* Skip IFS whitespace before the field */
1940 field_begin
+= strspn (field_begin
, ifs_white
);
1942 if (!seen_nonws_ifs
&& *field_begin
== 0)
1943 /* Nothing but whitespace */
1946 /* Search for the end of the field */
1947 field_end
= field_begin
+ strcspn (field_begin
, ifs
);
1949 /* Set up pointer to the character after end of field and
1950 skip whitespace IFS after it. */
1951 next_field
= field_end
+ strspn (field_end
, ifs_white
);
1953 /* Skip at most one non-whitespace IFS character after the field */
1955 if (*next_field
&& strchr (ifs
, *next_field
))
1961 /* Null-terminate it */
1964 /* Tag a copy onto the current word */
1965 *word
= w_addstr (*word
, word_length
, max_length
, field_begin
);
1967 if (*word
== NULL
&& *field_begin
!= '\0')
1973 field_begin
= next_field
;
1975 while (seen_nonws_ifs
|| *field_begin
);
1987 error
= WRDE_NOSPACE
;
1991 error
= WRDE_SYNTAX
;
2005 parse_dollars (char **word
, size_t *word_length
, size_t *max_length
,
2006 const char *words
, size_t *offset
, int flags
,
2007 wordexp_t
*pwordexp
, const char *ifs
, const char *ifs_white
,
2010 /* We are poised _at_ "$" */
2011 switch (words
[1 + *offset
])
2016 *word
= w_addchar (*word
, word_length
, max_length
, '$');
2017 return *word
? 0 : WRDE_NOSPACE
;
2020 if (words
[2 + *offset
] == '(')
2022 /* Differentiate between $((1+3)) and $((echo);(ls)) */
2023 int i
= 3 + *offset
;
2025 while (words
[i
] && !(depth
== 0 && words
[i
] == ')'))
2027 if (words
[i
] == '(')
2029 else if (words
[i
] == ')')
2035 if (words
[i
] == ')' && words
[i
+ 1] == ')')
2038 /* Call parse_arith -- 0 is for "no brackets" */
2039 return parse_arith (word
, word_length
, max_length
, words
, offset
,
2044 if (flags
& WRDE_NOCMD
)
2048 return parse_comm (word
, word_length
, max_length
, words
, offset
, flags
,
2049 quoted
? NULL
: pwordexp
, ifs
, ifs_white
);
2053 /* Call parse_arith -- 1 is for "brackets" */
2054 return parse_arith (word
, word_length
, max_length
, words
, offset
, flags
,
2059 ++(*offset
); /* parse_param needs to know if "{" is there */
2060 return parse_param (word
, word_length
, max_length
, words
, offset
, flags
,
2061 pwordexp
, ifs
, ifs_white
, quoted
);
2067 parse_backtick (char **word
, size_t *word_length
, size_t *max_length
,
2068 const char *words
, size_t *offset
, int flags
,
2069 wordexp_t
*pwordexp
, const char *ifs
, const char *ifs_white
)
2071 /* We are poised just after "`" */
2076 char *comm
= w_newword (&comm_length
, &comm_maxlen
);
2078 for (; words
[*offset
]; ++(*offset
))
2080 switch (words
[*offset
])
2083 /* Go -- give the script to the shell */
2084 error
= exec_comm (comm
, word
, word_length
, max_length
, flags
,
2085 pwordexp
, ifs
, ifs_white
);
2092 error
= parse_qtd_backslash (&comm
, &comm_length
, &comm_maxlen
,
2105 error
= parse_backslash (&comm
, &comm_length
, &comm_maxlen
, words
,
2117 squoting
= 1 - squoting
;
2119 comm
= w_addchar (comm
, &comm_length
, &comm_maxlen
, words
[*offset
]);
2121 return WRDE_NOSPACE
;
2132 parse_dquote (char **word
, size_t *word_length
, size_t *max_length
,
2133 const char *words
, size_t *offset
, int flags
,
2134 wordexp_t
*pwordexp
, const char * ifs
, const char * ifs_white
)
2136 /* We are poised just after a double-quote */
2139 for (; words
[*offset
]; ++(*offset
))
2141 switch (words
[*offset
])
2147 error
= parse_dollars (word
, word_length
, max_length
, words
, offset
,
2148 flags
, pwordexp
, ifs
, ifs_white
, 1);
2149 /* The ``1'' here is to tell parse_dollars not to
2150 * split the fields. It may need to, however ("$@").
2158 if (flags
& WRDE_NOCMD
)
2162 error
= parse_backtick (word
, word_length
, max_length
, words
,
2163 offset
, flags
, NULL
, NULL
, NULL
);
2164 /* The first NULL here is to tell parse_backtick not to
2173 error
= parse_qtd_backslash (word
, word_length
, max_length
, words
,
2182 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
2184 return WRDE_NOSPACE
;
2188 /* Unterminated string */
2193 * wordfree() is to be called after pwordexp is finished with.
2197 wordfree (wordexp_t
*pwordexp
)
2200 /* wordexp can set pwordexp to NULL */
2201 if (pwordexp
&& pwordexp
->we_wordv
)
2203 char **wordv
= pwordexp
->we_wordv
;
2205 for (wordv
+= pwordexp
->we_offs
; *wordv
; ++wordv
)
2208 free (pwordexp
->we_wordv
);
2209 pwordexp
->we_wordv
= NULL
;
2212 libc_hidden_def (wordfree
)
2219 wordexp (const char *words
, wordexp_t
*pwordexp
, int flags
)
2221 size_t words_offset
;
2224 char *word
= w_newword (&word_length
, &max_length
);
2228 wordexp_t old_word
= *pwordexp
;
2230 if (flags
& WRDE_REUSE
)
2232 /* Minimal implementation of WRDE_REUSE for now */
2233 wordfree (pwordexp
);
2234 old_word
.we_wordv
= NULL
;
2237 if ((flags
& WRDE_APPEND
) == 0)
2239 pwordexp
->we_wordc
= 0;
2241 if (flags
& WRDE_DOOFFS
)
2243 pwordexp
->we_wordv
= calloc (1 + pwordexp
->we_offs
, sizeof (char *));
2244 if (pwordexp
->we_wordv
== NULL
)
2246 error
= WRDE_NOSPACE
;
2252 pwordexp
->we_wordv
= calloc (1, sizeof (char *));
2253 if (pwordexp
->we_wordv
== NULL
)
2255 error
= WRDE_NOSPACE
;
2259 pwordexp
->we_offs
= 0;
2263 /* Find out what the field separators are.
2264 * There are two types: whitespace and non-whitespace.
2266 ifs
= getenv ("IFS");
2269 /* IFS unset - use <space><tab><newline>. */
2270 ifs
= strcpy (ifs_white
, " \t\n");
2274 char *whch
= ifs_white
;
2276 /* Start off with no whitespace IFS characters */
2277 ifs_white
[0] = '\0';
2279 while (*ifsch
!= '\0')
2281 if ((*ifsch
== ' ') || (*ifsch
== '\t') || (*ifsch
== '\n'))
2283 /* Whitespace IFS. See first whether it is already in our
2285 char *runp
= ifs_white
;
2287 while (runp
< whch
&& *runp
!= '\0' && *runp
!= *ifsch
)
2299 for (words_offset
= 0 ; words
[words_offset
] ; ++words_offset
)
2300 switch (words
[words_offset
])
2303 error
= parse_backslash (&word
, &word_length
, &max_length
, words
,
2312 error
= parse_dollars (&word
, &word_length
, &max_length
, words
,
2313 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
,
2322 if (flags
& WRDE_NOCMD
)
2324 error
= WRDE_CMDSUB
;
2329 error
= parse_backtick (&word
, &word_length
, &max_length
, words
,
2330 &words_offset
, flags
, pwordexp
, ifs
,
2340 error
= parse_dquote (&word
, &word_length
, &max_length
, words
,
2341 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
);
2348 error
= w_addword (pwordexp
, NULL
);
2358 error
= parse_squote (&word
, &word_length
, &max_length
, words
,
2366 error
= w_addword (pwordexp
, NULL
);
2375 error
= parse_tilde (&word
, &word_length
, &max_length
, words
,
2376 &words_offset
, pwordexp
->we_wordc
);
2386 error
= parse_glob (&word
, &word_length
, &max_length
, words
,
2387 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
);
2395 /* Is it a word separator? */
2396 if (strchr (" \t", words
[words_offset
]) == NULL
)
2398 char ch
= words
[words_offset
];
2400 /* Not a word separator -- but is it a valid word char? */
2401 if (strchr ("\n|&;<>(){}", ch
))
2404 error
= WRDE_BADCHAR
;
2408 /* "Ordinary" character -- add it to word */
2409 word
= w_addchar (word
, &word_length
, &max_length
,
2413 error
= WRDE_NOSPACE
;
2420 /* If a word has been delimited, add it to the list. */
2423 error
= w_addword (pwordexp
, word
);
2428 word
= w_newword (&word_length
, &max_length
);
2433 /* There was a word separator at the end */
2434 if (word
== NULL
) /* i.e. w_newword */
2437 /* There was no field separator at the end */
2438 return w_addword (pwordexp
, word
);
2442 * free memory used (unless error is WRDE_NOSPACE), and
2443 * set pwordexp members back to what they were.
2449 if (error
== WRDE_NOSPACE
)
2450 return WRDE_NOSPACE
;
2452 if ((flags
& WRDE_APPEND
) == 0)
2453 wordfree (pwordexp
);
2455 *pwordexp
= old_word
;