1 /* POSIX.2 wordexp implementation.
2 Copyright (C) 1997-2015 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Tim Waugh <tim@cyberelk.demon.co.uk>.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, see
18 <http://www.gnu.org/licenses/>. */
34 #include <sys/param.h>
37 #include <sys/types.h>
38 #include <sys/types.h>
43 #include <kernel-features.h>
45 #include <libc-lock.h>
/* Uncomment the following line for the production version.  */
49 /* #define NDEBUG 1 */
52 /* Get some device information. */
53 #include <device-nrs.h>
/*
 * This is a recursive-descent-style word expansion routine.
 */
/* These variables are defined and initialized in the startup code.  */
extern int __libc_argc attribute_hidden;
extern char **__libc_argv attribute_hidden;

/* Some forward declarations.  The parsers below call each other
   recursively, so these prototypes must precede their definitions.  */
static int parse_dollars (char **word, size_t *word_length, size_t *max_length,
                          const char *words, size_t *offset, int flags,
                          wordexp_t *pwordexp, const char *ifs,
                          const char *ifs_white, int quoted)
     internal_function;
static int parse_backtick (char **word, size_t *word_length,
                           size_t *max_length, const char *words,
                           size_t *offset, int flags, wordexp_t *pwordexp,
                           const char *ifs, const char *ifs_white)
     internal_function;
static int parse_dquote (char **word, size_t *word_length, size_t *max_length,
                         const char *words, size_t *offset, int flags,
                         wordexp_t *pwordexp, const char *ifs,
                         const char *ifs_white)
     internal_function;
static int eval_expr (char *expr, long int *result) internal_function;
81 /* The w_*() functions manipulate word lists. */
/* Start a fresh, empty word: reset the used length *ACTLEN and the
   capacity *MAXLEN to zero and return NULL as the (empty) buffer.
   Result of w_newword will be ignored if it's the last word.  */
static inline char *
w_newword (size_t *actlen, size_t *maxlen)
{
  *actlen = *maxlen = 0;
  return NULL;
}
/* Add a character to the buffer, allocating room for it if needed.

   BUFFER is the current word (NULL for an empty word), *ACTLEN its
   length and *MAXLEN its capacity (lengths exclude trailing zero).
   Returns the possibly relocated buffer, or NULL when memory could not
   be obtained; in that case the old buffer has already been freed.  */
static inline char *
w_addchar (char *buffer, size_t *actlen, size_t *maxlen, char ch)
{
  if (*actlen == *maxlen)
    {
      char *old_buffer = buffer;
      assert (buffer == NULL || *maxlen != 0);
      *maxlen += W_CHUNK;
      buffer = realloc (old_buffer, 1 + *maxlen);

      /* realloc leaves the old block alone on failure; release it so
         that callers only ever have to deal with a NULL result.  */
      if (buffer == NULL)
        free (old_buffer);
    }

  if (buffer != NULL)
    {
      buffer[*actlen] = ch;
      buffer[++(*actlen)] = '\0';
    }

  return buffer;
}
/* Add LEN bytes starting at STR to the buffer, allocating room for them
   if needed.

   *ACTLEN and *MAXLEN are the buffer's length and capacity (lengths
   exclude trailing zero).  Returns the possibly relocated buffer, or
   NULL when memory could not be obtained; in that case the old buffer
   has already been freed.  */
static char *
internal_function
w_addmem (char *buffer, size_t *actlen, size_t *maxlen, const char *str,
          size_t len)
{
  if (*actlen + len > *maxlen)
    {
      char *old_buffer = buffer;
      assert (buffer == NULL || *maxlen != 0);
      /* Grow generously so that repeated appends stay cheap.  */
      *maxlen += MAX (2 * len, W_CHUNK);
      buffer = realloc (old_buffer, 1 + *maxlen);

      if (buffer == NULL)
        free (old_buffer);
    }

  if (buffer != NULL)
    {
      /* __mempcpy returns the end of the copy, which is exactly where
         the terminating zero belongs.  */
      *((char *) __mempcpy (&buffer[*actlen], str, len)) = '\0';
      *actlen += len;
    }

  return buffer;
}
/* Add the null-terminated string STR to the buffer, allocating room for
   it if needed.  (Lengths exclude trailing zero.)  Returns what w_addmem
   returns: the possibly relocated buffer, or NULL on failure.  */
static char *
internal_function
w_addstr (char *buffer, size_t *actlen, size_t *maxlen, const char *str)
{
  size_t len;

  assert (str != NULL); /* w_addstr only called from this file */
  len = strlen (str);

  return w_addmem (buffer, actlen, maxlen, str, len);
}
/* Add a word to the wordlist.

   WORD is stored as-is in PWORDEXP->we_wordv (no copy is made) and the
   vector is kept NULL-terminated.  Returns 0 on success or WRDE_NOSPACE
   if memory ran out; on failure a caller-supplied WORD is neither
   stored nor freed.  */
static int
internal_function
w_addword (wordexp_t *pwordexp, char *word)
{
  size_t num_p;
  char **new_wordv;
  bool allocated = false;

  /* Internally, NULL acts like "".  Convert NULLs to "" before
   * the caller sees them.
   */
  if (word == NULL)
    {
      word = __strdup ("");
      if (word == NULL)
        goto no_space;
      allocated = true;
    }

  /* Room for the new word plus the terminating NULL pointer.  */
  num_p = 2 + pwordexp->we_wordc + pwordexp->we_offs;
  new_wordv = realloc (pwordexp->we_wordv, sizeof (char *) * num_p);
  if (new_wordv != NULL)
    {
      pwordexp->we_wordv = new_wordv;
      pwordexp->we_wordv[pwordexp->we_offs + pwordexp->we_wordc++] = word;
      pwordexp->we_wordv[pwordexp->we_offs + pwordexp->we_wordc] = NULL;
      return 0;
    }

  /* Only release the word if it is the "" we created above.  */
  if (allocated)
    free (word);

no_space:
  return WRDE_NOSPACE;
}
/* The parse_*() functions should leave *offset being the offset in 'words'
 * to the last character processed.
 */

/* Handle a backslash outside of quotes.  We are poised _at_ the
   backslash.  The following character is appended literally to *WORD,
   except that a backslash-newline pair is dropped altogether.
   Returns 0 on success, WRDE_SYNTAX if the backslash is the last
   character of WORDS, or WRDE_NOSPACE if memory ran out.  */
static int
internal_function
parse_backslash (char **word, size_t *word_length, size_t *max_length,
                 const char *words, size_t *offset)
{
  switch (words[1 + *offset])
    {
    case 0:
      /* Backslash is last character of input words */
      return WRDE_SYNTAX;

    case '\n':
      /* Line continuation: swallow both characters.  */
      ++(*offset);
      break;

    default:
      *word = w_addchar (*word, word_length, max_length, words[1 + *offset]);
      if (*word == NULL)
        return WRDE_NOSPACE;

      ++(*offset);
      break;
    }

  return 0;
}
/* Handle a backslash inside double quotes.  We are poised _at_ the
   backslash.  Only `$', ``', `"' and `\' are escaped by it (and a
   backslash-newline pair is dropped); before any other character the
   backslash is kept, so both characters are appended to *WORD.
   Returns 0 on success, WRDE_SYNTAX if the backslash is the last
   character of WORDS, or WRDE_NOSPACE if memory ran out.  */
static int
internal_function
parse_qtd_backslash (char **word, size_t *word_length, size_t *max_length,
                     const char *words, size_t *offset)
{
  switch (words[1 + *offset])
    {
    case 0:
      /* Backslash is last character of input words */
      return WRDE_SYNTAX;

    case '\n':
      ++(*offset);
      break;

    case '$':
    case '`':
    case '"':
    case '\\':
      *word = w_addchar (*word, word_length, max_length, words[1 + *offset]);
      if (*word == NULL)
        return WRDE_NOSPACE;

      ++(*offset);
      break;

    default:
      /* Not an escape sequence: keep the backslash itself as well.  */
      *word = w_addchar (*word, word_length, max_length, words[*offset]);
      if (*word != NULL)
        *word = w_addchar (*word, word_length, max_length, words[1 + *offset]);

      if (*word == NULL)
        return WRDE_NOSPACE;

      ++(*offset);
      break;
    }

  return 0;
}
276 parse_tilde (char **word
, size_t *word_length
, size_t *max_length
,
277 const char *words
, size_t *offset
, size_t wordc
)
279 /* We are poised _at_ a tilde */
282 if (*word_length
!= 0)
284 if (!((*word
)[*word_length
- 1] == '=' && wordc
== 0))
286 if (!((*word
)[*word_length
- 1] == ':'
287 && strchr (*word
, '=') && wordc
== 0))
289 *word
= w_addchar (*word
, word_length
, max_length
, '~');
290 return *word
? 0 : WRDE_NOSPACE
;
295 for (i
= 1 + *offset
; words
[i
]; i
++)
297 if (words
[i
] == ':' || words
[i
] == '/' || words
[i
] == ' ' ||
298 words
[i
] == '\t' || words
[i
] == 0 )
301 if (words
[i
] == '\\')
303 *word
= w_addchar (*word
, word_length
, max_length
, '~');
304 return *word
? 0 : WRDE_NOSPACE
;
308 if (i
== 1 + *offset
)
310 /* Tilde appears on its own */
312 struct passwd pwd
, *tpwd
;
318 /* POSIX.2 says ~ expands to $HOME and if HOME is unset the
319 results are unspecified. We do a lookup on the uid if
322 home
= getenv ("HOME");
325 *word
= w_addstr (*word
, word_length
, max_length
, home
);
332 buffer
= __alloca (buflen
);
334 while ((result
= __getpwuid_r (uid
, &pwd
, buffer
, buflen
, &tpwd
)) != 0
336 buffer
= extend_alloca (buffer
, buflen
, buflen
+ 1000);
338 if (result
== 0 && tpwd
!= NULL
&& pwd
.pw_dir
!= NULL
)
340 *word
= w_addstr (*word
, word_length
, max_length
, pwd
.pw_dir
);
346 *word
= w_addchar (*word
, word_length
, max_length
, '~');
354 /* Look up user name in database to get home directory */
355 char *user
= strndupa (&words
[1 + *offset
], i
- (1 + *offset
));
356 struct passwd pwd
, *tpwd
;
358 char* buffer
= __alloca (buflen
);
361 while ((result
= __getpwnam_r (user
, &pwd
, buffer
, buflen
, &tpwd
)) != 0
363 buffer
= extend_alloca (buffer
, buflen
, buflen
+ 1000);
365 if (result
== 0 && tpwd
!= NULL
&& pwd
.pw_dir
)
366 *word
= w_addstr (*word
, word_length
, max_length
, pwd
.pw_dir
);
369 /* (invalid login name) */
370 *word
= w_addchar (*word
, word_length
, max_length
, '~');
372 *word
= w_addstr (*word
, word_length
, max_length
, user
);
377 return *word
? 0 : WRDE_NOSPACE
;
/* Expand the glob pattern GLOB_WORD.

   If IFS is the empty string no field splitting is allowed, and all
   matches are appended to *WORD separated by single spaces.  Otherwise
   *WORD is discarded and every match is added to PWORDEXP as a word of
   its own.  GLOB_NOCHECK makes glob return the pattern itself when
   nothing matches.  Returns 0 on success or WRDE_NOSPACE if memory ran
   out.  */
static int
internal_function
do_parse_glob (const char *glob_word, char **word, size_t *word_length,
               size_t *max_length, wordexp_t *pwordexp, const char *ifs,
               const char *ifs_white)
{
  int error;
  unsigned int match;
  glob_t globbuf;

  error = glob (glob_word, GLOB_NOCHECK, NULL, &globbuf);

  if (error != 0)
    {
      /* We can only run into memory problems.  */
      assert (error == GLOB_NOSPACE);
      return WRDE_NOSPACE;
    }

  if (ifs && !*ifs)
    {
      /* No field splitting allowed.  */
      assert (globbuf.gl_pathv[0] != NULL);
      *word = w_addstr (*word, word_length, max_length, globbuf.gl_pathv[0]);
      for (match = 1; match < globbuf.gl_pathc && *word != NULL; ++match)
        {
          *word = w_addchar (*word, word_length, max_length, ' ');
          if (*word != NULL)
            *word = w_addstr (*word, word_length, max_length,
                              globbuf.gl_pathv[match]);
        }

      globfree (&globbuf);
      return *word ? 0 : WRDE_NOSPACE;
    }

  assert (ifs == NULL || *ifs != '\0');
  if (*word != NULL)
    {
      free (*word);
      *word = w_newword (word_length, max_length);
    }

  for (match = 0; match < globbuf.gl_pathc; ++match)
    {
      char *matching_word = __strdup (globbuf.gl_pathv[match]);
      if (matching_word == NULL || w_addword (pwordexp, matching_word))
        {
          /* w_addword does not take ownership when it fails, so the
             copy has to be released here (free (NULL) is harmless).  */
          free (matching_word);
          globfree (&globbuf);
          return WRDE_NOSPACE;
        }
    }

  globfree (&globbuf);
  return 0;
}
440 parse_glob (char **word
, size_t *word_length
, size_t *max_length
,
441 const char *words
, size_t *offset
, int flags
,
442 wordexp_t
*pwordexp
, const char *ifs
, const char *ifs_white
)
444 /* We are poised just after a '*', a '[' or a '?'. */
445 int error
= WRDE_NOSPACE
;
446 int quoted
= 0; /* 1 if singly-quoted, 2 if doubly */
448 wordexp_t glob_list
; /* List of words to glob */
450 glob_list
.we_wordc
= 0;
451 glob_list
.we_wordv
= NULL
;
452 glob_list
.we_offs
= 0;
453 for (; words
[*offset
] != '\0'; ++*offset
)
455 if (strchr (ifs
, words
[*offset
]) != NULL
)
459 /* Sort out quoting */
460 if (words
[*offset
] == '\'')
467 else if (quoted
== 1)
473 else if (words
[*offset
] == '"')
480 else if (quoted
== 2)
487 /* Sort out other special characters */
488 if (quoted
!= 1 && words
[*offset
] == '$')
490 error
= parse_dollars (word
, word_length
, max_length
, words
,
491 offset
, flags
, &glob_list
, ifs
, ifs_white
,
498 else if (words
[*offset
] == '\\')
501 error
= parse_qtd_backslash (word
, word_length
, max_length
,
504 error
= parse_backslash (word
, word_length
, max_length
,
513 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
518 /* Don't forget to re-parse the character we stopped at. */
522 error
= w_addword (&glob_list
, *word
);
523 *word
= w_newword (word_length
, max_length
);
524 for (i
= 0; error
== 0 && i
< glob_list
.we_wordc
; i
++)
525 error
= do_parse_glob (glob_list
.we_wordv
[i
], word
, word_length
,
526 max_length
, pwordexp
, ifs
, ifs_white
);
530 wordfree (&glob_list
);
/* Copy a single-quoted string into *WORD.  We are poised just after a
   single quote; every character up to the closing quote is taken
   literally.  On success *OFFSET is left at the closing quote.
   Returns 0 on success, WRDE_SYNTAX if the string is unterminated, or
   WRDE_NOSPACE if memory ran out.  */
static int
internal_function
parse_squote (char **word, size_t *word_length, size_t *max_length,
              const char *words, size_t *offset)
{
  for (; words[*offset]; ++(*offset))
    {
      if (words[*offset] == '\'')
        return 0;

      *word = w_addchar (*word, word_length, max_length, words[*offset]);
      if (*word == NULL)
        return WRDE_NOSPACE;
    }

  /* Unterminated string */
  return WRDE_SYNTAX;
}
/* Functions to evaluate an arithmetic expression */

/* eval_expr_val recurses into eval_expr for parenthesised operands.  */
static int eval_expr (char *expr, long int *result) internal_function;

/* Return the first character of S that is not white space.  The cast
   keeps isspace well defined for characters with a negative value.  */
static inline char *
eval_skip_space (char *s)
{
  while (*s != '\0' && isspace ((unsigned char) *s))
    ++s;
  return s;
}

/* Parse one operand at *EXPR: an integer constant or a parenthesised
   sub-expression.  The value is stored in *RESULT and *EXPR is advanced
   past the operand.  The expression text is modified in place (the
   closing paren of a sub-expression is overwritten).  Returns 0 on
   success or WRDE_SYNTAX.  */
static int
internal_function
eval_expr_val (char **expr, long int *result)
{
  char *digit = eval_skip_space (*expr);

  if (*digit == '(')
    {
      /* Scan for the matching closing paren.  Nesting is tracked so
         that operands such as "((1+2)*3)" are split at the right
         place instead of at the first ')'.  */
      int depth = 1;
      char *close;

      for (close = digit + 1; *close != '\0'; ++close)
        {
          if (*close == '(')
            ++depth;
          else if (*close == ')' && --depth == 0)
            break;
        }

      /* Is there one? */
      if (*close == '\0')
        return WRDE_SYNTAX;

      /* Cut the sub-expression out and continue after the paren.  */
      *close = '\0';
      *expr = close + 1;

      if (eval_expr (digit + 1, result))
        return WRDE_SYNTAX;

      return 0;
    }

  /* POSIX requires that decimal, octal, and hexadecimal constants are
     recognized.  Therefore we pass 0 as the third parameter to strtol.  */
  *result = strtol (digit, expr, 0);
  if (digit == *expr)
    return WRDE_SYNTAX;

  return 0;
}

/* Evaluate a sequence of operands joined by `*' and `/'.  Returns 0 on
   success or WRDE_SYNTAX (also used for division by zero).  */
static int
internal_function
eval_expr_multdiv (char **expr, long int *result)
{
  long int arg;

  /* Read a Value */
  if (eval_expr_val (expr, result) != 0)
    return WRDE_SYNTAX;

  while (**expr)
    {
      *expr = eval_skip_space (*expr);

      if (**expr == '*')
        {
          ++(*expr);
          if (eval_expr_val (expr, &arg) != 0)
            return WRDE_SYNTAX;

          /* Multiply as unsigned so that overflow wraps instead of
             being undefined behaviour.  */
          *result = (long int) ((unsigned long int) *result
                                * (unsigned long int) arg);
        }
      else if (**expr == '/')
        {
          ++(*expr);
          if (eval_expr_val (expr, &arg) != 0)
            return WRDE_SYNTAX;

          /* Division by zero or integer overflow.  */
          if (arg == 0 || (arg == -1 && *result == LONG_MIN))
            return WRDE_SYNTAX;

          *result /= arg;
        }
      else
        break;
    }

  return 0;
}

/* Evaluate the arithmetic expression EXPR (terms joined by `+' and `-')
   and store its value in *RESULT.  EXPR is modified while it is being
   evaluated.  Returns 0 on success or WRDE_SYNTAX.  */
static int
internal_function
eval_expr (char *expr, long int *result)
{
  long int arg;

  /* Read a Multdiv */
  if (eval_expr_multdiv (&expr, result) != 0)
    return WRDE_SYNTAX;

  while (*expr)
    {
      expr = eval_skip_space (expr);

      if (*expr == '+')
        {
          ++expr;
          if (eval_expr_multdiv (&expr, &arg) != 0)
            return WRDE_SYNTAX;

          /* Unsigned arithmetic: wrap on overflow, no undefined
             behaviour.  */
          *result = (long int) ((unsigned long int) *result
                                + (unsigned long int) arg);
        }
      else if (*expr == '-')
        {
          ++expr;
          if (eval_expr_multdiv (&expr, &arg) != 0)
            return WRDE_SYNTAX;

          *result = (long int) ((unsigned long int) *result
                                - (unsigned long int) arg);
        }
      else
        break;
    }

  return 0;
}
/* Append the decimal representation of VALUE to *WORD.  Returns 0 on
   success or WRDE_NOSPACE if memory ran out.  Shared by the "$((...))"
   and "$[...]" forms so that both print negative results with a
   leading minus sign.  */
static int
arith_append_result (char **word, size_t *word_length, size_t *max_length,
                     long int value)
{
  char result[21];      /* 21 = ceil(log10(2^64)) + 1 */
  unsigned long long int magnitude = value;

  if (value < 0)
    {
      /* Negate in unsigned arithmetic; -LONG_MIN would overflow as a
         signed operation.  */
      magnitude = -magnitude;
      *word = w_addchar (*word, word_length, max_length, '-');
      if (*word == NULL)
        return WRDE_NOSPACE;
    }

  result[20] = '\0';
  *word = w_addstr (*word, word_length, max_length,
                    _itoa (magnitude, &result[20], 10, 0));
  return *word ? 0 : WRDE_NOSPACE;
}

/* Perform arithmetic expansion.  We are poised just after "$((" or
   "$[" (BRACKET is nonzero for the latter).  The text up to the
   matching "))" or "]" is collected, with nested `$' expansions and
   backtick substitutions carried out on the way, then evaluated and
   the decimal result appended to *WORD.  Returns 0 on success,
   WRDE_SYNTAX for a malformed expression, WRDE_NOSPACE if memory ran
   out, or the error reported by a nested expansion.  */
static int
internal_function
parse_arith (char **word, size_t *word_length, size_t *max_length,
             const char *words, size_t *offset, int flags, int bracket)
{
  int error;
  int paren_depth = 1;
  size_t expr_length;
  size_t expr_maxlen;
  char *expr;

  expr = w_newword (&expr_length, &expr_maxlen);
  for (; words[*offset]; ++(*offset))
    {
      switch (words[*offset])
        {
        case '$':
          error = parse_dollars (&expr, &expr_length, &expr_maxlen,
                                 words, offset, flags, NULL, NULL, NULL, 1);
          /* The ``1'' here is to tell parse_dollars not to
           * split the fields.
           */
          if (error)
            {
              free (expr);
              return error;
            }
          break;

        case '`':
          (*offset)++;
          error = parse_backtick (&expr, &expr_length, &expr_maxlen,
                                  words, offset, flags, NULL, NULL, NULL);
          /* The first NULL here is to tell parse_backtick not to
           * split the fields.
           */
          if (error)
            {
              free (expr);
              return error;
            }
          break;

        case '\\':
          error = parse_qtd_backslash (&expr, &expr_length, &expr_maxlen,
                                       words, offset);
          if (error)
            {
              free (expr);
              return error;
            }
          /* I think that a backslash within an
           * arithmetic expansion is bound to
           * cause an error sooner or later anyway though.
           */
          break;

        case ')':
          if (--paren_depth == 0)
            {
              long int numresult = 0;

              if (bracket || words[1 + *offset] != ')')
                {
                  free (expr);
                  return WRDE_SYNTAX;
                }

              ++(*offset);

              /* Go - evaluate.  EXPR is still NULL when nothing was
                 collected; an empty expression yields 0.  */
              if (expr != NULL && *expr != '\0'
                  && eval_expr (expr, &numresult) != 0)
                {
                  free (expr);
                  return WRDE_SYNTAX;
                }

              error = arith_append_result (word, word_length, max_length,
                                           numresult);
              free (expr);
              return error;
            }
          expr = w_addchar (expr, &expr_length, &expr_maxlen, words[*offset]);
          if (expr == NULL)
            return WRDE_NOSPACE;

          break;

        case ']':
          if (bracket && paren_depth == 1)
            {
              long int numresult = 0;

              /* Go - evaluate. */
              if (expr != NULL && *expr != '\0'
                  && eval_expr (expr, &numresult) != 0)
                {
                  free (expr);
                  return WRDE_SYNTAX;
                }

              error = arith_append_result (word, word_length, max_length,
                                           numresult);
              free (expr);
              return error;
            }

          free (expr);
          return WRDE_SYNTAX;

        case '\n':
        case ';':
        case '{':
        case '}':
          free (expr);
          return WRDE_SYNTAX;

        case '(':
          ++paren_depth;
          /* fall through */
        default:
          expr = w_addchar (expr, &expr_length, &expr_maxlen, words[*offset]);
          if (expr == NULL)
            return WRDE_NOSPACE;
        }
    }

  /* Premature end */
  free (expr);
  return WRDE_SYNTAX;
}
818 /* Function called by child process in exec_comm() */
820 internal_function
__attribute__ ((always_inline
))
821 exec_comm_child (char *comm
, int *fildes
, int showerr
, int noexec
)
823 const char *args
[4] = { _PATH_BSHELL
, "-c", comm
, NULL
};
825 /* Execute the command, or just check syntax? */
829 /* Redirect output. */
830 if (__glibc_likely (fildes
[1] != STDOUT_FILENO
))
832 __dup2 (fildes
[1], STDOUT_FILENO
);
838 /* Reset the close-on-exec flag (if necessary). */
839 # ifndef __ASSUME_PIPE2
840 if (__have_pipe2
> 0)
842 __fcntl (fildes
[1], F_SETFD
, 0);
846 /* Redirect stderr to /dev/null if we have to. */
851 __close (STDERR_FILENO
);
852 fd
= __open (_PATH_DEVNULL
, O_WRONLY
);
853 if (fd
>= 0 && fd
!= STDERR_FILENO
)
855 __dup2 (fd
, STDERR_FILENO
);
858 /* Be paranoid. Check that we actually opened the /dev/null
860 if (__builtin_expect (__fxstat64 (_STAT_VER
, STDERR_FILENO
, &st
), 0) != 0
861 || __builtin_expect (S_ISCHR (st
.st_mode
), 1) == 0
862 #if defined DEV_NULL_MAJOR && defined DEV_NULL_MINOR
863 || st
.st_rdev
!= makedev (DEV_NULL_MAJOR
, DEV_NULL_MINOR
)
866 /* It's not the /dev/null device. Stop right here. The
867 problem is: how do we stop? We use _exit() with an
868 hopefully unusual exit code. */
872 /* Make sure the subshell doesn't field-split on our behalf. */
876 __execve (_PATH_BSHELL
, (char *const *) args
, __environ
);
882 /* Function to execute a command and retrieve the results */
883 /* pwordexp contains NULL if field-splitting is forbidden */
886 exec_comm (char *comm
, char **word
, size_t *word_length
, size_t *max_length
,
887 int flags
, wordexp_t
*pwordexp
, const char *ifs
,
888 const char *ifs_white
)
895 size_t maxnewlines
= 0;
896 char buffer
[bufsize
];
900 /* Do nothing if command substitution should not succeed. */
901 if (flags
& WRDE_NOCMD
)
904 /* Don't fork() unless necessary */
909 # ifndef __ASSUME_PIPE2
910 if (__have_pipe2
>= 0)
913 int r
= __pipe2 (fildes
, O_CLOEXEC
);
914 # ifndef __ASSUME_PIPE2
915 if (__have_pipe2
== 0)
916 __have_pipe2
= r
!= -1 || errno
!= ENOSYS
? 1 : -1;
918 if (__have_pipe2
> 0)
925 #ifndef __ASSUME_PIPE2
927 if (__have_pipe2
< 0)
929 if (__pipe (fildes
) < 0)
935 if ((pid
= __fork ()) < 0)
944 exec_comm_child (comm
, fildes
, noexec
? 0 : flags
& WRDE_SHOWERR
, noexec
);
948 /* If we are just testing the syntax, only wait. */
950 return (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
, 0)) == pid
951 && status
!= 0) ? WRDE_SYNTAX
: 0;
957 /* Quoted - no field splitting */
961 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
964 /* If read returned 0 then the process has closed its
965 stdout. Don't use WNOHANG in that case to avoid busy
966 looping until the process eventually exits. */
967 if (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
,
968 buflen
== 0 ? 0 : WNOHANG
))
971 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
976 maxnewlines
+= buflen
;
978 *word
= w_addmem (*word
, word_length
, max_length
, buffer
, buflen
);
984 /* Not quoted - split fields */
988 * 0 when searching for first character in a field not IFS white space
989 * 1 when copying the text of a field
990 * 2 when searching for possible non-whitespace IFS
991 * 3 when searching for non-newline after copying field
996 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
999 /* If read returned 0 then the process has closed its
1000 stdout. Don't use WNOHANG in that case to avoid busy
1001 looping until the process eventually exits. */
1002 if (TEMP_FAILURE_RETRY (__waitpid (pid
, &status
,
1003 buflen
== 0 ? 0 : WNOHANG
))
1006 if ((buflen
= TEMP_FAILURE_RETRY (__read (fildes
[0], buffer
,
1011 for (i
= 0; i
< buflen
; ++i
)
1013 if (strchr (ifs
, buffer
[i
]) != NULL
)
1015 /* Current character is IFS */
1016 if (strchr (ifs_white
, buffer
[i
]) == NULL
)
1018 /* Current character is IFS but not whitespace */
1021 /* current character
1024 * eg: text<space><comma><space>moretext
1026 * So, strip whitespace IFS (like at the start)
1033 /* fall through and delimit field.. */
1037 if (buffer
[i
] == '\n')
1039 /* Current character is (IFS) newline */
1041 /* If copying a field, this is the end of it,
1042 but maybe all that's left is trailing newlines.
1043 So start searching for a non-newline. */
1051 /* Current character is IFS white space, but
1054 /* If not either copying a field or searching
1055 for non-newline after a field, ignore it */
1056 if (copying
!= 1 && copying
!= 3)
1059 /* End of field (search for non-ws IFS afterwards) */
1064 /* First IFS white space (non-newline), or IFS non-whitespace.
1065 * Delimit the field. Nulls are converted by w_addword. */
1066 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1069 *word
= w_newword (word_length
, max_length
);
1072 /* fall back round the loop.. */
1076 /* Not IFS character */
1080 /* Nothing but (IFS) newlines since the last field,
1081 so delimit it here before starting new word */
1082 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1085 *word
= w_newword (word_length
, max_length
);
1090 if (buffer
[i
] == '\n') /* happens if newline not in IFS */
1095 *word
= w_addchar (*word
, word_length
, max_length
,
1104 /* Chop off trailing newlines (required by POSIX.2) */
1105 /* Ensure we don't go back further than the beginning of the
1106 substitution (i.e. remove maxnewlines bytes at most) */
1107 while (maxnewlines
-- != 0 &&
1108 *word_length
> 0 && (*word
)[*word_length
- 1] == '\n')
1110 (*word
)[--*word_length
] = '\0';
1112 /* If the last word was entirely newlines, turn it into a new word
1113 * which can be ignored if there's nothing following it. */
1114 if (*word_length
== 0)
1117 *word
= w_newword (word_length
, max_length
);
1122 __close (fildes
[0]);
1125 /* Check for syntax error (re-execute but with "-n" flag) */
1126 if (buflen
< 1 && status
!= 0)
1135 __kill (pid
, SIGKILL
);
1136 TEMP_FAILURE_RETRY (__waitpid (pid
, NULL
, 0));
1137 __close (fildes
[0]);
1138 return WRDE_NOSPACE
;
/* Perform "$(...)" command substitution.  We are poised just after
   "$(".  The text up to the matching unquoted `)' is collected as the
   script, then handed to exec_comm, whose output is added to *WORD (and
   to PWORDEXP when field splitting applies).  Parentheses inside single
   or double quotes do not count towards nesting.  Returns the result of
   exec_comm (0 for an empty command), WRDE_SYNTAX if the closing paren
   is missing, or WRDE_NOSPACE if memory ran out.  */
static int
internal_function
parse_comm (char **word, size_t *word_length, size_t *max_length,
            const char *words, size_t *offset, int flags, wordexp_t *pwordexp,
            const char *ifs, const char *ifs_white)
{
  int paren_depth = 1;
  int error = 0;
  int quoted = 0; /* 1 for singly-quoted, 2 for doubly-quoted */
  size_t comm_length;
  size_t comm_maxlen;
  char *comm = w_newword (&comm_length, &comm_maxlen);

  for (; words[*offset]; ++(*offset))
    {
      switch (words[*offset])
        {
        case '\'':
          if (quoted == 0)
            quoted = 1;
          else if (quoted == 1)
            quoted = 0;

          break;

        case '"':
          if (quoted == 0)
            quoted = 2;
          else if (quoted == 2)
            quoted = 0;

          break;

        case ')':
          if (!quoted && --paren_depth == 0)
            {
              /* Go -- give script to the shell */
              if (comm)
                {
#ifdef __libc_ptf_call
                  /* We do not want the exec_comm call to be cut short
                     by a thread cancellation since cleanup is very
                     ugly.  Therefore disable cancellation for
                     now.  */
                  // XXX Ideally we do want the thread being cancelable.
                  // XXX If demand is there we'll change it.
                  int state = PTHREAD_CANCEL_ENABLE;
                  __libc_ptf_call (__pthread_setcancelstate,
                                   (PTHREAD_CANCEL_DISABLE, &state), 0);
#endif

                  error = exec_comm (comm, word, word_length, max_length,
                                     flags, pwordexp, ifs, ifs_white);

#ifdef __libc_ptf_call
                  __libc_ptf_call (__pthread_setcancelstate,
                                   (state, NULL), 0);
#endif

                  free (comm);
                }

              return error;
            }

          /* This is just part of the script */
          break;

        case '(':
          if (!quoted)
            ++paren_depth;
        }

      /* Every character, quotes and parens included, belongs to the
         script that the shell will see.  */
      comm = w_addchar (comm, &comm_length, &comm_maxlen, words[*offset]);
      if (comm == NULL)
        return WRDE_NOSPACE;
    }

  /* Premature end.  */
  free (comm);

  return WRDE_SYNTAX;
}
/* Nonzero if the character CH occurs in CHAR_SET, which must be a
   string literal (the `char_set ""' concatenation rejects anything
   else).  The terminating null byte is not part of the set.  */
#define CHAR_IN_SET(ch, char_set) \
  (memchr (char_set "", (ch), sizeof (char_set) - 1) != NULL)
1231 parse_param (char **word
, size_t *word_length
, size_t *max_length
,
1232 const char *words
, size_t *offset
, int flags
, wordexp_t
*pwordexp
,
1233 const char *ifs
, const char *ifs_white
, int quoted
)
1235 /* We are poised just after "$" */
1239 ACT_RP_SHORT_LEFT
= '#',
1240 ACT_RP_LONG_LEFT
= 'L',
1241 ACT_RP_SHORT_RIGHT
= '%',
1242 ACT_RP_LONG_RIGHT
= 'R',
1243 ACT_NULL_ERROR
= '?',
1244 ACT_NULL_SUBST
= '-',
1245 ACT_NONNULL_SUBST
= '+',
1246 ACT_NULL_ASSIGN
= '='
1252 size_t start
= *offset
;
1256 enum action action
= ACT_NONE
;
1261 int pattern_is_quoted
= 0; /* 1 for singly-quoted, 2 for doubly-quoted */
1265 int brace
= words
[*offset
] == '{';
1267 env
= w_newword (&env_length
, &env_maxlen
);
1268 pattern
= w_newword (&pat_length
, &pat_maxlen
);
1273 /* First collect the parameter name. */
1275 if (words
[*offset
] == '#')
1283 if (isalpha (words
[*offset
]) || words
[*offset
] == '_')
1285 /* Normal parameter name. */
1288 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1293 while (isalnum (words
[++*offset
]) || words
[*offset
] == '_');
1295 else if (isdigit (words
[*offset
]))
1297 /* Numeric parameter name. */
1301 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1308 while (isdigit(words
[++*offset
]));
1310 else if (CHAR_IN_SET (words
[*offset
], "*@$"))
1312 /* Special parameter. */
1314 env
= w_addchar (env
, &env_length
, &env_maxlen
,
1328 /* Check for special action to be applied to the value. */
1329 switch (words
[*offset
])
1336 action
= ACT_RP_SHORT_LEFT
;
1337 if (words
[1 + *offset
] == '#')
1340 action
= ACT_RP_LONG_LEFT
;
1345 action
= ACT_RP_SHORT_RIGHT
;
1346 if (words
[1 + *offset
] == '%')
1349 action
= ACT_RP_LONG_RIGHT
;
1354 if (!CHAR_IN_SET (words
[1 + *offset
], "-=?+"))
1358 action
= words
[++*offset
];
1365 action
= words
[*offset
];
1372 /* Now collect the pattern, but don't expand it yet. */
1374 for (; words
[*offset
]; ++(*offset
))
1376 switch (words
[*offset
])
1379 if (!pattern_is_quoted
)
1384 if (!pattern_is_quoted
)
1393 if (pattern_is_quoted
)
1394 /* Quoted; treat as normal character. */
1397 /* Otherwise, it's an escape: next character is literal. */
1398 if (words
[++*offset
] == '\0')
1401 pattern
= w_addchar (pattern
, &pat_length
, &pat_maxlen
, '\\');
1402 if (pattern
== NULL
)
1408 if (pattern_is_quoted
== 0)
1409 pattern_is_quoted
= 1;
1410 else if (pattern_is_quoted
== 1)
1411 pattern_is_quoted
= 0;
1416 if (pattern_is_quoted
== 0)
1417 pattern_is_quoted
= 2;
1418 else if (pattern_is_quoted
== 2)
1419 pattern_is_quoted
= 0;
1424 pattern
= w_addchar (pattern
, &pat_length
, &pat_maxlen
,
1426 if (pattern
== NULL
)
1431 /* End of input string -- remember to reparse the character that we
1436 if (words
[start
] == '{' && words
[*offset
] != '}')
1443 /* $# expands to the number of positional parameters */
1445 value
= _itoa_word (__libc_argc
- 1, &buffer
[20], 10, 0);
1450 /* Just $ on its own */
1451 *offset
= start
- 1;
1452 *word
= w_addchar (*word
, word_length
, max_length
, '$');
1453 return *word
? 0 : WRDE_NOSPACE
;
1456 /* Is it a numeric parameter? */
1457 else if (isdigit (env
[0]))
1461 if (n
>= __libc_argc
)
1462 /* Substitute NULL. */
1465 /* Replace with appropriate positional parameter. */
1466 value
= __libc_argv
[n
];
1468 /* Is it a special parameter? */
1475 value
= _itoa_word (__getpid (), &buffer
[20], 10, 0);
1477 /* Is it `${#*}' or `${#@}'? */
1478 else if ((*env
== '*' || *env
== '@') && seen_hash
)
1481 value
= _itoa_word (__libc_argc
> 0 ? __libc_argc
- 1 : 0,
1482 &buffer
[20], 10, 0);
1483 *word
= w_addstr (*word
, word_length
, max_length
, value
);
1486 return *word
? 0 : WRDE_NOSPACE
;
1488 /* Is it `$*' or `$@' (unquoted) ? */
1489 else if (*env
== '*' || (*env
== '@' && !quoted
))
1491 size_t plist_len
= 0;
1495 /* Build up value parameter by parameter (copy them) */
1496 for (p
= 1; __libc_argv
[p
]; ++p
)
1497 plist_len
+= strlen (__libc_argv
[p
]) + 1; /* for space */
1498 value
= malloc (plist_len
);
1503 for (p
= 1; __libc_argv
[p
]; ++p
)
1507 end
= __stpcpy (end
, __libc_argv
[p
]);
1514 /* Must be a quoted `$@' */
1515 assert (*env
== '@' && quoted
);
1517 /* Each parameter is a separate word ("$@") */
1518 if (__libc_argc
== 2)
1519 value
= __libc_argv
[1];
1520 else if (__libc_argc
> 2)
1524 /* Append first parameter to current word. */
1525 value
= w_addstr (*word
, word_length
, max_length
,
1527 if (value
== NULL
|| w_addword (pwordexp
, value
))
1530 for (p
= 2; __libc_argv
[p
+ 1]; p
++)
1532 char *newword
= __strdup (__libc_argv
[p
]);
1533 if (newword
== NULL
|| w_addword (pwordexp
, newword
))
1537 /* Start a new word with the last parameter. */
1538 *word
= w_newword (word_length
, max_length
);
1539 value
= __libc_argv
[p
];
1550 value
= getenv (env
);
1552 if (value
== NULL
&& (flags
& WRDE_UNDEF
))
1554 /* Variable not defined. */
1555 error
= WRDE_BADVAL
;
1559 if (action
!= ACT_NONE
)
1561 int expand_pattern
= 0;
1563 /* First, find out if we need to expand pattern (i.e. if we will
1567 case ACT_RP_SHORT_LEFT
:
1568 case ACT_RP_LONG_LEFT
:
1569 case ACT_RP_SHORT_RIGHT
:
1570 case ACT_RP_LONG_RIGHT
:
1571 /* Always expand for these. */
1575 case ACT_NULL_ERROR
:
1576 case ACT_NULL_SUBST
:
1577 case ACT_NULL_ASSIGN
:
1578 if (!value
|| (!*value
&& colon_seen
))
1579 /* If param is unset, or set but null and a colon has been seen,
1580 the expansion of the pattern will be needed. */
1585 case ACT_NONNULL_SUBST
:
1586 /* Expansion of word will be needed if parameter is set and not null,
1587 or set null but no colon has been seen. */
1588 if (value
&& (*value
|| !colon_seen
))
1594 assert (! "Unrecognised action!");
1599 /* We need to perform tilde expansion, parameter expansion,
1600 command substitution, and arithmetic expansion. We also
1601 have to be a bit careful with wildcard characters, as
1602 pattern might be given to fnmatch soon. To do this, we
1603 convert quotes to escapes. */
1609 int quoted
= 0; /* 1: single quotes; 2: double */
1611 expanded
= w_newword (&exp_len
, &exp_maxl
);
1612 for (p
= pattern
; p
&& *p
; p
++)
1621 else if (quoted
== 0)
1630 else if (quoted
== 0)
1640 /* Convert quoted wildchar to escaped wildchar. */
1641 expanded
= w_addchar (expanded
, &exp_len
,
1644 if (expanded
== NULL
)
1651 error
= parse_dollars (&expanded
, &exp_len
, &exp_maxl
, p
,
1652 &offset
, flags
, NULL
, NULL
, NULL
, 1);
1667 if (quoted
|| exp_len
)
1671 error
= parse_tilde (&expanded
, &exp_len
, &exp_maxl
, p
,
1687 expanded
= w_addchar (expanded
, &exp_len
, &exp_maxl
, '\\');
1689 assert (*p
); /* checked when extracted initially */
1690 if (expanded
== NULL
)
1694 expanded
= w_addchar (expanded
, &exp_len
, &exp_maxl
, *p
);
1696 if (expanded
== NULL
)
1707 case ACT_RP_SHORT_LEFT
:
1708 case ACT_RP_LONG_LEFT
:
1709 case ACT_RP_SHORT_RIGHT
:
1710 case ACT_RP_LONG_RIGHT
:
1716 if (value
== NULL
|| pattern
== NULL
|| *pattern
== '\0')
1719 end
= value
+ strlen (value
);
1723 case ACT_RP_SHORT_LEFT
:
1724 for (p
= value
; p
<= end
; ++p
)
1728 if (fnmatch (pattern
, value
, 0) != FNM_NOMATCH
)
1733 char *newval
= __strdup (p
);
1751 case ACT_RP_LONG_LEFT
:
1752 for (p
= end
; p
>= value
; --p
)
1756 if (fnmatch (pattern
, value
, 0) != FNM_NOMATCH
)
1761 char *newval
= __strdup (p
);
1779 case ACT_RP_SHORT_RIGHT
:
1780 for (p
= end
; p
>= value
; --p
)
1782 if (fnmatch (pattern
, p
, 0) != FNM_NOMATCH
)
1785 newval
= malloc (p
- value
+ 1);
1794 *(char *) __mempcpy (newval
, value
, p
- value
) = '\0';
1805 case ACT_RP_LONG_RIGHT
:
1806 for (p
= value
; p
<= end
; ++p
)
1808 if (fnmatch (pattern
, p
, 0) != FNM_NOMATCH
)
1811 newval
= malloc (p
- value
+ 1);
1820 *(char *) __mempcpy (newval
, value
, p
- value
) = '\0';
1838 case ACT_NULL_ERROR
:
1839 if (value
&& *value
)
1840 /* Substitute parameter */
1844 if (!colon_seen
&& value
)
1845 /* Substitute NULL */
1849 const char *str
= pattern
;
1852 str
= _("parameter null or not set");
1854 __fxprintf (NULL
, "%s: %s\n", env
, str
);
1861 case ACT_NULL_SUBST
:
1862 if (value
&& *value
)
1863 /* Substitute parameter */
1869 if (!colon_seen
&& value
)
1870 /* Substitute NULL */
1873 value
= pattern
? __strdup (pattern
) : pattern
;
1876 if (pattern
&& !value
)
1881 case ACT_NONNULL_SUBST
:
1882 if (value
&& (*value
|| !colon_seen
))
1887 value
= pattern
? __strdup (pattern
) : pattern
;
1890 if (pattern
&& !value
)
1896 /* Substitute NULL */
1901 case ACT_NULL_ASSIGN
:
1902 if (value
&& *value
)
1903 /* Substitute parameter */
1906 if (!colon_seen
&& value
)
1908 /* Substitute NULL */
1917 value
= pattern
? __strdup (pattern
) : pattern
;
1920 if (pattern
&& !value
)
1923 __setenv (env
, value
?: "", 1);
1927 assert (! "Unrecognised action!");
1938 char param_length
[21];
1939 param_length
[20] = '\0';
1940 *word
= w_addstr (*word
, word_length
, max_length
,
1941 _itoa_word (value
? strlen (value
) : 0,
1942 ¶m_length
[20], 10, 0));
1945 assert (value
!= NULL
);
1949 return *word
? 0 : WRDE_NOSPACE
;
1955 if (quoted
|| !pwordexp
)
1957 /* Quoted - no field split */
1958 *word
= w_addstr (*word
, word_length
, max_length
, value
);
1962 return *word
? 0 : WRDE_NOSPACE
;
1966 /* Need to field-split */
1967 char *value_copy
= __strdup (value
); /* Don't modify value */
1968 char *field_begin
= value_copy
;
1969 int seen_nonws_ifs
= 0;
1974 if (value_copy
== NULL
)
1979 char *field_end
= field_begin
;
1982 /* If this isn't the first field, start a new word */
1983 if (field_begin
!= value_copy
)
1985 if (w_addword (pwordexp
, *word
) == WRDE_NOSPACE
)
1991 *word
= w_newword (word_length
, max_length
);
1994 /* Skip IFS whitespace before the field */
1995 field_begin
+= strspn (field_begin
, ifs_white
);
1997 if (!seen_nonws_ifs
&& *field_begin
== 0)
1998 /* Nothing but whitespace */
2001 /* Search for the end of the field */
2002 field_end
= field_begin
+ strcspn (field_begin
, ifs
);
2004 /* Set up pointer to the character after end of field and
2005 skip whitespace IFS after it. */
2006 next_field
= field_end
+ strspn (field_end
, ifs_white
);
2008 /* Skip at most one non-whitespace IFS character after the field */
2010 if (*next_field
&& strchr (ifs
, *next_field
))
2016 /* Null-terminate it */
2019 /* Tag a copy onto the current word */
2020 *word
= w_addstr (*word
, word_length
, max_length
, field_begin
);
2022 if (*word
== NULL
&& *field_begin
!= '\0')
2028 field_begin
= next_field
;
2030 while (seen_nonws_ifs
|| *field_begin
);
2042 error
= WRDE_NOSPACE
;
2046 error
= WRDE_SYNTAX
;
/* Dispatch on the construct introduced by a `$'.  We are poised _at_
   "$".  Depending on what follows, this is arithmetic expansion
   ("$((...))" or "$[...]"), command substitution ("$(...)") or
   parameter expansion; a `$' followed by a quote or by the end of the
   input is taken literally.  QUOTED is nonzero inside double quotes, in
   which case command output is not field-split.  Returns 0 on success
   or a WRDE_* error code.  */
static int
internal_function
parse_dollars (char **word, size_t *word_length, size_t *max_length,
               const char *words, size_t *offset, int flags,
               wordexp_t *pwordexp, const char *ifs, const char *ifs_white,
               int quoted)
{
  switch (words[1 + *offset])
    {
    case '"':
    case '\'':
    case 0:
      *word = w_addchar (*word, word_length, max_length, '$');
      return *word ? 0 : WRDE_NOSPACE;

    case '(':
      if (words[2 + *offset] == '(')
        {
          /* Differentiate between $((1+3)) and $((echo);(ls)) */
          /* The index is a size_t like *offset, so that long inputs
             are not truncated to int.  */
          size_t i = 3 + *offset;
          int depth = 0;
          while (words[i] && !(depth == 0 && words[i] == ')'))
            {
              if (words[i] == '(')
                ++depth;
              else if (words[i] == ')')
                --depth;

              ++i;
            }

          if (words[i] == ')' && words[i + 1] == ')')
            {
              (*offset) += 3;
              /* Call parse_arith -- 0 is for "no brackets" */
              return parse_arith (word, word_length, max_length, words, offset,
                                  flags, 0);
            }
        }

      (*offset) += 2;
      return parse_comm (word, word_length, max_length, words, offset, flags,
                         quoted ? NULL : pwordexp, ifs, ifs_white);

    case '[':
      (*offset) += 2;
      /* Call parse_arith -- 1 is for "brackets" */
      return parse_arith (word, word_length, max_length, words, offset, flags,
                          1);

    case '{':
    default:
      ++(*offset);      /* parse_param needs to know if "{" is there */
      return parse_param (word, word_length, max_length, words, offset, flags,
                          pwordexp, ifs, ifs_white, quoted);
    }
}
/* parse_backtick: collect the text of a backtick command substitution
   from WORDS, starting at *OFFSET, into a separate buffer, then pass
   that buffer to exec_comm together with the destination word, FLAGS,
   PWORDEXP and the IFS strings.  *OFFSET is advanced in place as
   characters are consumed.
   NOTE(review): this listing is lossy -- case labels, braces and the
   error checks between the statements are not visible, so the exact
   conditions for each branch cannot be confirmed from here.  */
2119 parse_backtick (char **word
, size_t *word_length
, size_t *max_length
,
2120 const char *words
, size_t *offset
, int flags
,
2121 wordexp_t
*pwordexp
, const char *ifs
, const char *ifs_white
)
2123 /* We are poised just after "`" */
/* COMM is a fresh buffer from w_newword that accumulates the command
   text; it is distinct from the caller-owned *WORD.  */
2128 char *comm
= w_newword (&comm_length
, &comm_maxlen
);
/* Walk WORDS one character at a time until its terminating NUL.  */
2130 for (; words
[*offset
]; ++(*offset
))
2132 switch (words
[*offset
])
2135 /* Go -- give the script to the shell */
2136 error
= exec_comm (comm
, word
, word_length
, max_length
, flags
,
2137 pwordexp
, ifs
, ifs_white
);
/* Two backslash handlers are visible, both writing into COMM.
   NOTE(review): the condition that chooses between them is not
   visible here; presumably it depends on SQUOTING -- confirm.  */
2144 error
= parse_qtd_backslash (&comm
, &comm_length
, &comm_maxlen
,
2156 error
= parse_backslash (&comm
, &comm_length
, &comm_maxlen
, words
,
/* Flip SQUOTING between 0 and 1.  */
2168 squoting
= 1 - squoting
;
/* Append the current character of WORDS to COMM.  */
2170 comm
= w_addchar (comm
, &comm_length
, &comm_maxlen
, words
[*offset
]);
2172 return WRDE_NOSPACE
;
/* parse_dquote: process the inside of a double-quoted string in WORDS,
   starting at *OFFSET, appending the result to *WORD.  The visible
   body switches on each character and either calls parse_dollars (with
   a final argument of 1), parse_backtick (with NULL for PWORDEXP and
   both IFS strings) or parse_qtd_backslash, or appends the character
   with w_addchar.  A return of WRDE_NOSPACE is visible after the
   w_addchar call.
   NOTE(review): this listing is lossy -- case labels, braces and error
   checks are not visible, and two comments further down have lost their
   closing delimiter, so no annotations are added past the parse_dollars
   call.  */
2183 parse_dquote (char **word
, size_t *word_length
, size_t *max_length
,
2184 const char *words
, size_t *offset
, int flags
,
2185 wordexp_t
*pwordexp
, const char * ifs
, const char * ifs_white
)
2187 /* We are poised just after a double-quote */
/* Walk WORDS one character at a time until its terminating NUL,
   advancing *OFFSET in place.  */
2190 for (; words
[*offset
]; ++(*offset
))
2192 switch (words
[*offset
])
/* Dollar expansion inside the quotes; the trailing 1 is the QUOTED
   argument of parse_dollars.  */
2198 error
= parse_dollars (word
, word_length
, max_length
, words
, offset
,
2199 flags
, pwordexp
, ifs
, ifs_white
, 1);
2200 /* The ``1'' here is to tell parse_dollars not to
2201 * split the fields. It may need to, however ("$@").
2210 error
= parse_backtick (word
, word_length
, max_length
, words
,
2211 offset
, flags
, NULL
, NULL
, NULL
);
2212 /* The first NULL here is to tell parse_backtick not to
2221 error
= parse_qtd_backslash (word
, word_length
, max_length
, words
,
2230 *word
= w_addchar (*word
, word_length
, max_length
, words
[*offset
]);
2232 return WRDE_NOSPACE
;
2236 /* Unterminated string */
/* wordfree: release the word vector held by PWORDEXP and set its
   we_wordv member to NULL.  Does nothing when PWORDEXP is NULL or when
   its we_wordv member is already NULL.
   NOTE(review): this listing is lossy -- the return type, braces and
   the body of the loop are not visible.  */
2241 * wordfree() is to be called after pwordexp is finished with.
2245 wordfree (wordexp_t
*pwordexp
)
2248 /* wordexp can set pwordexp to NULL */
2249 if (pwordexp
&& pwordexp
->we_wordv
)
2251 char **wordv
= pwordexp
->we_wordv
;
/* Start we_offs slots into the vector and walk forward until a NULL
   entry is reached.  NOTE(review): the loop body is not visible;
   presumably it frees each entry -- confirm against the full file.  */
2253 for (wordv
+= pwordexp
->we_offs
; *wordv
; ++wordv
)
/* Release the vector itself, then clear the pointer so that a second
   call takes the early-out path above.  */
2256 free (pwordexp
->we_wordv
);
2257 pwordexp
->we_wordv
= NULL
;
/* Hidden-visibility definition marker for wordfree.  */
2260 libc_hidden_def (wordfree
)
/* wordexp: expand the string WORDS into the word list PWORDEXP under
   control of FLAGS.  The visible stages are:
     1. snapshot *PWORDEXP, then handle WRDE_REUSE, WRDE_APPEND and
	WRDE_DOOFFS, allocating the word vector with calloc;
     2. read IFS from the environment and derive its whitespace subset;
     3. walk WORDS one character at a time, dispatching to the parse_*
	helpers or appending ordinary characters to the current word;
     4. on error, either return WRDE_NOSPACE at once or clean up and
	restore the snapshot of *PWORDEXP.
   NOTE(review): this listing is lossy -- the return type, case labels,
   braces, several statements and the final return are not visible, and
   two comments in the middle have lost their closing delimiter, so no
   annotations are added inside those spans.  */
2267 wordexp (const char *words
, wordexp_t
*pwordexp
, int flags
)
2269 size_t words_offset
;
/* WORD is the buffer for the word currently being assembled.  */
2272 char *word
= w_newword (&word_length
, &max_length
);
/* Snapshot of the caller structure; it is copied back into *PWORDEXP
   on the error path at the end.  */
2276 wordexp_t old_word
= *pwordexp
;
2278 if (flags
& WRDE_REUSE
)
2280 /* Minimal implementation of WRDE_REUSE for now */
2281 wordfree (pwordexp
);
/* The old vector was just freed, so clear it in the snapshot too;
   otherwise the restore at the end would put back a freed pointer.  */
2282 old_word
.we_wordv
= NULL
;
/* Not appending: start from an empty word list.  */
2285 if ((flags
& WRDE_APPEND
) == 0)
2287 pwordexp
->we_wordc
= 0;
2289 if (flags
& WRDE_DOOFFS
)
/* Zeroed vector with we_offs leading slots plus one more slot.  */
2291 pwordexp
->we_wordv
= calloc (1 + pwordexp
->we_offs
, sizeof (char *));
2292 if (pwordexp
->we_wordv
== NULL
)
2294 error
= WRDE_NOSPACE
;
/* NOTE(review): presumably the branch taken without WRDE_DOOFFS (the
   else keyword is not visible): a single zeroed slot, and we_offs is
   reset to 0.  */
2300 pwordexp
->we_wordv
= calloc (1, sizeof (char *));
2301 if (pwordexp
->we_wordv
== NULL
)
2303 error
= WRDE_NOSPACE
;
2307 pwordexp
->we_offs
= 0;
2311 /* Find out what the field separators are.
2312 * There are two types: whitespace and non-whitespace.
2314 ifs
= getenv ("IFS");
2317 /* IFS unset - use <space><tab><newline>. */
2318 ifs
= strcpy (ifs_white
, " \t\n");
/* NOTE(review): WHCH appears to be the write position inside
   IFS_WHITE; the statements that store through it are not visible.  */
2322 char *whch
= ifs_white
;
/* Loop over the characters at IFSCH until the terminating NUL.  */
2324 while (*ifsch
!= '\0')
2326 if (*ifsch
== ' ' || *ifsch
== '\t' || *ifsch
== '\n')
2328 /* Whitespace IFS. See first whether it is already in our
2330 char *runp
= ifs_white
;
2332 while (runp
< whch
&& *runp
!= *ifsch
)
2344 for (words_offset
= 0 ; words
[words_offset
] ; ++words_offset
)
2345 switch (words
[words_offset
])
2348 error
= parse_backslash (&word
, &word_length
, &max_length
, words
,
2357 error
= parse_dollars (&word
, &word_length
, &max_length
, words
,
2358 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
,
2368 error
= parse_backtick (&word
, &word_length
, &max_length
, words
,
2369 &words_offset
, flags
, pwordexp
, ifs
,
2379 error
= parse_dquote (&word
, &word_length
, &max_length
, words
,
2380 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
);
2387 error
= w_addword (pwordexp
, NULL
);
2397 error
= parse_squote (&word
, &word_length
, &max_length
, words
,
2405 error
= w_addword (pwordexp
, NULL
);
2414 error
= parse_tilde (&word
, &word_length
, &max_length
, words
,
2415 &words_offset
, pwordexp
->we_wordc
);
2425 error
= parse_glob (&word
, &word_length
, &max_length
, words
,
2426 &words_offset
, flags
, pwordexp
, ifs
, ifs_white
);
2434 /* Is it a word separator? */
/* Only space and tab are tested as word separators here.  */
2435 if (strchr (" \t", words
[words_offset
]) == NULL
)
2437 char ch
= words
[words_offset
];
2439 /* Not a word separator -- but is it a valid word char? */
/* Characters in this set yield WRDE_BADCHAR.  */
2440 if (strchr ("\n|&;<>(){}", ch
))
2443 error
= WRDE_BADCHAR
;
2447 /* "Ordinary" character -- add it to word */
2448 word
= w_addchar (word
, &word_length
, &max_length
,
2452 error
= WRDE_NOSPACE
;
2459 /* If a word has been delimited, add it to the list. */
2462 error
= w_addword (pwordexp
, word
);
/* Begin a fresh buffer for the next word.  */
2467 word
= w_newword (&word_length
, &max_length
);
2472 /* There was a word separator at the end */
2473 if (word
== NULL
) /* i.e. w_newword */
2476 /* There was no field separator at the end */
2477 return w_addword (pwordexp
, word
);
2481 * free memory used (unless error is WRDE_NOSPACE), and
2482 * set pwordexp members back to what they were.
/* Out-of-memory is returned at once, skipping the cleanup below.  */
2487 if (error
== WRDE_NOSPACE
)
2488 return WRDE_NOSPACE
;
/* Unless appending, free whatever this call stored in *PWORDEXP.  */
2490 if ((flags
& WRDE_APPEND
) == 0)
2491 wordfree (pwordexp
);
/* Put back the structure captured on entry.  */
2493 *pwordexp
= old_word
;