2 * Copyright (c) 1991, 1993
3 * The Regents of the University of California. All rights reserved.
4 * Copyright (c) 1997-2005
5 * Herbert Xu <herbert@gondor.apana.org.au>. All rights reserved.
7 * This code is derived from software contributed to Berkeley by
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. Neither the name of the University nor the names of its contributors
19 * may be used to endorse or promote products derived from this software
20 * without specific prior written permission.
22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 static char sccsid
[] = "@(#)expand.c 8.5 (Berkeley) 5/15/95";
40 #include <sys/cdefs.h>
41 __FBSDID("$FreeBSD$");
43 #include <sys/types.h>
59 * Routines to expand arguments to commands. We have to deal with
60 * backquotes, shell variables, and file metacharacters.
83 * Structure specifying which parts of the string should be searched
88 struct ifsregion
*next
; /* next region in list */
89 int begoff
; /* offset of start of region */
90 int endoff
; /* offset of end of region */
91 int inquotes
; /* search for nul bytes only */
95 static char *expdest
; /* output of current string */
96 static struct nodelist
*argbackq
; /* list of back quote expressions */
97 static struct ifsregion ifsfirst
; /* first struct in list of ifs regions */
98 static struct ifsregion
*ifslastp
; /* last struct in list */
99 static struct arglist exparg
; /* holds expanded arg list */
101 static char *argstr(char *, int);
102 static char *exptilde(char *, int);
103 static char *expari(char *);
104 static void expbackq(union node
*, int, int);
105 static int subevalvar(char *, char *, int, int, int, int, int);
106 static char *evalvar(char *, int);
107 static int varisset(const char *, int);
108 static void strtodest(const char *, int, int, int);
109 static void varvalue(const char *, int, int, int);
110 static void recordregion(int, int, int);
111 static void removerecordregions(int);
112 static void ifsbreakup(char *, struct arglist
*);
113 static void expandmeta(struct strlist
*);
114 static void expmeta(char *, char *);
115 static void addfname(char *);
116 static struct strlist
*expsort(struct strlist
*);
117 static struct strlist
*msort(struct strlist
*, int);
118 static int patmatch(const char *, const char *, int);
119 static char *cvtnum(int, char *);
120 static int collate_range_cmp(wchar_t, wchar_t);
123 collate_range_cmp(wchar_t c1
, wchar_t c2
)
125 static wchar_t s1
[2], s2
[2];
129 return (wcscoll(s1
, s2
));
133 stputs_quotes(const char *data
, const char *syntax
, char *p
)
137 if (syntax
[(int)*data
] == CCTL
)
143 #define STPUTS_QUOTES(data, syntax, p) p = stputs_quotes((data), syntax, p)
146 * Perform expansions on an argument, placing the resulting list of arguments
147 * in arglist. Parameter expansion, command substitution and arithmetic
148 * expansion are always performed; additional expansions can be requested
150 * The result is left in the stack string.
151 * When arglist is NULL, perform here document expansion.
153 * Caution: this function uses global state and is not reentrant.
154 * However, a new invocation after an interrupted invocation is safe
155 * and will reset the global state for the new call.
158 expandarg(union node
*arg
, struct arglist
*arglist
, int flag
)
163 argbackq
= arg
->narg
.backquote
;
164 STARTSTACKSTR(expdest
);
165 ifsfirst
.next
= NULL
;
167 argstr(arg
->narg
.text
, flag
);
168 if (arglist
== NULL
) {
169 STACKSTRNUL(expdest
);
170 return; /* here document expanded */
172 STPUTC('\0', expdest
);
173 p
= grabstackstr(expdest
);
174 exparg
.lastp
= &exparg
.list
;
175 if (flag
& EXP_FULL
) {
176 ifsbreakup(p
, &exparg
);
177 *exparg
.lastp
= NULL
;
178 exparg
.lastp
= &exparg
.list
;
179 expandmeta(exparg
.list
);
181 sp
= (struct strlist
*)stalloc(sizeof (struct strlist
));
184 exparg
.lastp
= &sp
->next
;
186 while (ifsfirst
.next
!= NULL
) {
187 struct ifsregion
*ifsp
;
189 ifsp
= ifsfirst
.next
->next
;
190 ckfree(ifsfirst
.next
);
191 ifsfirst
.next
= ifsp
;
194 *exparg
.lastp
= NULL
;
196 *arglist
->lastp
= exparg
.list
;
197 arglist
->lastp
= exparg
.lastp
;
204 * Perform parameter expansion, command substitution and arithmetic
205 * expansion, and tilde expansion if requested via EXP_TILDE/EXP_VARTILDE.
206 * Processing ends at a CTLENDVAR or CTLENDARI character as well as '\0'.
207 * This is used to expand word in ${var+word} etc.
208 * If EXP_FULL or EXP_CASE are set, keep and/or generate CTLESC
209 * characters to allow for further processing.
210 * If EXP_FULL is set, also preserve CTLQUOTEMARK characters.
213 argstr(char *p
, int flag
)
216 int quotes
= flag
& (EXP_FULL
| EXP_CASE
); /* do CTLESC */
221 split_lit
= flag
& EXP_SPLIT_LIT
;
222 lit_quoted
= flag
& EXP_LIT_QUOTED
;
223 flag
&= ~(EXP_SPLIT_LIT
| EXP_LIT_QUOTED
);
224 if (*p
== '~' && (flag
& (EXP_TILDE
| EXP_VARTILDE
)))
225 p
= exptilde(p
, flag
);
227 CHECKSTRSPACE(2, expdest
);
236 /* "$@" syntax adherence hack */
237 if (p
[0] == CTLVAR
&& p
[2] == '@' && p
[3] == '=')
239 if ((flag
& EXP_FULL
) != 0)
250 if (split_lit
&& !lit_quoted
)
251 recordregion(expdest
- stackblock() -
253 expdest
- stackblock(), 0);
256 p
= evalvar(p
, flag
);
259 case CTLBACKQ
|CTLQUOTE
:
260 expbackq(argbackq
->n
, c
& CTLQUOTE
, flag
);
261 argbackq
= argbackq
->next
;
269 * sort of a hack - expand tildes in variable
270 * assignments (after the first '=' and after ':'s).
273 if (split_lit
&& !lit_quoted
)
274 recordregion(expdest
- stackblock() - 1,
275 expdest
- stackblock(), 0);
276 if (flag
& EXP_VARTILDE
&& *p
== '~' &&
277 (c
!= '=' || firsteq
)) {
280 p
= exptilde(p
, flag
);
285 if (split_lit
&& !lit_quoted
)
286 recordregion(expdest
- stackblock() - 1,
287 expdest
- stackblock(), 0);
293 * Perform tilde expansion, placing the result in the stack string and
294 * returning the next position in the input string to process.
297 exptilde(char *p
, int flag
)
306 case CTLESC
: /* This means CTL* are always considered quoted. */
309 case CTLBACKQ
| CTLQUOTE
:
315 if ((flag
& EXP_VARTILDE
) == 0)
322 if (*(startp
+1) == '\0') {
323 home
= lookupvar("HOME");
325 pw
= getpwnam(startp
+1);
326 home
= pw
!= NULL
? pw
->pw_dir
: NULL
;
329 if (home
== NULL
|| *home
== '\0')
331 strtodest(home
, flag
, VSNORMAL
, 1);
340 removerecordregions(int endoff
)
342 if (ifslastp
== NULL
)
345 if (ifsfirst
.endoff
> endoff
) {
346 while (ifsfirst
.next
!= NULL
) {
347 struct ifsregion
*ifsp
;
349 ifsp
= ifsfirst
.next
->next
;
350 ckfree(ifsfirst
.next
);
351 ifsfirst
.next
= ifsp
;
354 if (ifsfirst
.begoff
> endoff
)
357 ifslastp
= &ifsfirst
;
358 ifsfirst
.endoff
= endoff
;
363 ifslastp
= &ifsfirst
;
364 while (ifslastp
->next
&& ifslastp
->next
->begoff
< endoff
)
365 ifslastp
=ifslastp
->next
;
366 while (ifslastp
->next
!= NULL
) {
367 struct ifsregion
*ifsp
;
369 ifsp
= ifslastp
->next
->next
;
370 ckfree(ifslastp
->next
);
371 ifslastp
->next
= ifsp
;
374 if (ifslastp
->endoff
> endoff
)
375 ifslastp
->endoff
= endoff
;
379 * Expand arithmetic expression.
380 * Note that flag is not required as digits never require CTLESC characters.
391 quoted
= *p
++ == '"';
392 begoff
= expdest
- stackblock();
394 removerecordregions(begoff
);
395 STPUTC('\0', expdest
);
396 start
= stackblock() + begoff
;
398 q
= grabstackstr(expdest
);
399 result
= arith(start
);
400 ungrabstackstr(q
, expdest
);
402 start
= stackblock() + begoff
;
403 adj
= start
- expdest
;
404 STADJUST(adj
, expdest
);
406 CHECKSTRSPACE((int)(DIGITS(result
) + 1), expdest
);
407 fmtstr(expdest
, DIGITS(result
), ARITH_FORMAT_STR
, result
);
408 adj
= strlen(expdest
);
409 STADJUST(adj
, expdest
);
411 recordregion(begoff
, expdest
- stackblock(), 0);
417 * Perform command substitution.
420 expbackq(union node
*cmd
, int quoted
, int flag
)
426 char *dest
= expdest
;
427 struct ifsregion saveifs
, *savelastp
;
428 struct nodelist
*saveargbackq
;
430 int startloc
= dest
- stackblock();
431 char const *syntax
= quoted
? DQSYNTAX
: BASESYNTAX
;
432 int quotes
= flag
& (EXP_FULL
| EXP_CASE
);
437 savelastp
= ifslastp
;
438 saveargbackq
= argbackq
;
439 p
= grabstackstr(dest
);
440 evalbackcmd(cmd
, &in
);
441 ungrabstackstr(p
, dest
);
443 ifslastp
= savelastp
;
444 argbackq
= saveargbackq
;
449 /* Don't copy trailing newlines */
451 if (--in
.nleft
< 0) {
454 while ((i
= read(in
.fd
, buf
, sizeof buf
)) < 0 && errno
== EINTR
);
455 TRACE(("expbackq: read returns %d\n", i
));
466 CHECKSTRSPACE(nnl
+ 2, dest
);
471 if (quotes
&& syntax
[(int)lastc
] == CCTL
)
472 USTPUTC(CTLESC
, dest
);
473 USTPUTC(lastc
, dest
);
483 exitstatus
= waitforjob(in
.jp
, (int *)NULL
);
485 recordregion(startloc
, dest
- stackblock(), 0);
486 TRACE(("expbackq: size=%td: \"%.*s\"\n",
487 ((dest
- stackblock()) - startloc
),
488 (int)((dest
- stackblock()) - startloc
),
489 stackblock() + startloc
));
497 recordleft(const char *str
, const char *loc
, char *startp
)
501 amount
= ((str
- 1) - (loc
- startp
)) - expdest
;
502 STADJUST(amount
, expdest
);
503 while (loc
!= str
- 1)
508 subevalvar(char *p
, char *str
, int strloc
, int subtype
, int startloc
,
509 int varflags
, int quotes
)
515 struct nodelist
*saveargbackq
= argbackq
;
518 argstr(p
, (subtype
== VSTRIMLEFT
|| subtype
== VSTRIMLEFTMAX
||
519 subtype
== VSTRIMRIGHT
|| subtype
== VSTRIMRIGHTMAX
?
520 EXP_CASE
: 0) | EXP_TILDE
);
521 STACKSTRNUL(expdest
);
522 argbackq
= saveargbackq
;
523 startp
= stackblock() + startloc
;
525 str
= stackblock() + strloc
;
529 setvar(str
, startp
, 0);
530 amount
= startp
- expdest
;
531 STADJUST(amount
, expdest
);
536 if (*p
!= CTLENDVAR
) {
537 outfmt(out2
, "%s\n", startp
);
540 error("%.*s: parameter %snot set", (int)(p
- str
- 1),
541 str
, (varflags
& VSNUL
) ? "null or " : "");
545 for (loc
= startp
; loc
< str
; loc
++) {
548 if (patmatch(str
, startp
, quotes
)) {
550 recordleft(str
, loc
, startp
);
554 if (quotes
&& *loc
== CTLESC
)
560 for (loc
= str
- 1; loc
>= startp
;) {
563 if (patmatch(str
, startp
, quotes
)) {
565 recordleft(str
, loc
, startp
);
570 if (quotes
&& loc
> startp
&& *(loc
- 1) == CTLESC
) {
571 for (q
= startp
; q
< loc
; q
++)
581 for (loc
= str
- 1; loc
>= startp
;) {
582 if (patmatch(str
, loc
, quotes
)) {
583 amount
= loc
- expdest
;
584 STADJUST(amount
, expdest
);
588 if (quotes
&& loc
> startp
&& *(loc
- 1) == CTLESC
) {
589 for (q
= startp
; q
< loc
; q
++)
599 for (loc
= startp
; loc
< str
- 1; loc
++) {
600 if (patmatch(str
, loc
, quotes
)) {
601 amount
= loc
- expdest
;
602 STADJUST(amount
, expdest
);
605 if (quotes
&& *loc
== CTLESC
)
618 * Expand a variable, and return a pointer to the next character in the
623 evalvar(char *p
, int flag
)
637 int quotes
= flag
& (EXP_FULL
| EXP_CASE
);
640 varflags
= (unsigned char)*p
++;
641 subtype
= varflags
& VSTYPE
;
646 p
= strchr(p
, '=') + 1;
647 again
: /* jump here after setting a variable with ${var=text} */
648 if (varflags
& VSLINENO
) {
652 } else if (special
) {
653 set
= varisset(var
, varflags
& VSNUL
);
656 val
= bltinlookup(var
, 1);
657 if (val
== NULL
|| ((varflags
& VSNUL
) && val
[0] == '\0')) {
664 startloc
= expdest
- stackblock();
665 if (!set
&& uflag
&& *var
!= '@' && *var
!= '*') {
673 error("%.*s: parameter not set", (int)(p
- var
- 1),
677 if (set
&& subtype
!= VSPLUS
) {
678 /* insert the value of the variable */
680 if (varflags
& VSLINENO
)
681 STPUTBIN(var
, p
- var
- 1, expdest
);
683 varvalue(var
, varflags
& VSQUOTE
, subtype
, flag
);
684 if (subtype
== VSLENGTH
) {
685 varlenb
= expdest
- stackblock() - startloc
;
688 val
= stackblock() + startloc
;
689 for (;val
!= expdest
; val
++)
690 if ((*val
& 0xC0) == 0x80)
693 STADJUST(-varlenb
, expdest
);
696 if (subtype
== VSLENGTH
) {
699 (*val
& 0xC0) != 0x80)
703 strtodest(val
, flag
, subtype
,
708 if (subtype
== VSPLUS
)
711 easy
= ((varflags
& VSQUOTE
) == 0 ||
712 (*var
== '@' && shellparam
.nparam
!= 1));
717 expdest
= cvtnum(varlen
, expdest
);
728 argstr(p
, flag
| (flag
& EXP_FULL
? EXP_SPLIT_LIT
: 0) |
729 (varflags
& VSQUOTE
? EXP_LIT_QUOTED
: 0));
742 * Terminate the string and start recording the pattern
745 STPUTC('\0', expdest
);
746 patloc
= expdest
- stackblock();
747 if (subevalvar(p
, NULL
, patloc
, subtype
,
748 startloc
, varflags
, quotes
) == 0) {
749 int amount
= (expdest
- stackblock() - patloc
) + 1;
750 STADJUST(-amount
, expdest
);
752 /* Remove any recorded regions beyond start of variable */
753 removerecordregions(startloc
);
760 if (subevalvar(p
, var
, 0, subtype
, startloc
, varflags
,
764 * Remove any recorded regions beyond
767 removerecordregions(startloc
);
777 error("${%.*s%s}: Bad substitution", c
, var
,
778 (c
> 0 && *p
!= CTLENDVAR
) ? "..." : "");
785 recordregion(startloc
, expdest
- stackblock(),
786 varflags
& VSQUOTE
|| (ifsset() && ifsval()[0] == '\0' &&
787 (*var
== '@' || *var
== '*')));
789 if (subtype
!= VSNORMAL
) { /* skip to end of alternative */
792 if ((c
= *p
++) == CTLESC
)
794 else if (c
== CTLBACKQ
|| c
== (CTLBACKQ
|CTLQUOTE
)) {
796 argbackq
= argbackq
->next
;
797 } else if (c
== CTLVAR
) {
798 if ((*p
++ & VSTYPE
) != VSNORMAL
)
800 } else if (c
== CTLENDVAR
) {
812 * Test whether a specialized variable is set.
816 varisset(const char *name
, int nulok
)
820 return backgndpidset();
821 else if (*name
== '@' || *name
== '*') {
822 if (*shellparam
.p
== NULL
)
828 for (av
= shellparam
.p
; *av
; av
++)
833 } else if (is_digit(*name
)) {
838 num
= strtol(name
, NULL
, 10);
839 if (errno
!= 0 || num
> shellparam
.nparam
)
845 ap
= shellparam
.p
[num
- 1];
847 if (nulok
&& (ap
== NULL
|| *ap
== '\0'))
854 strtodest(const char *p
, int flag
, int subtype
, int quoted
)
856 if (flag
& (EXP_FULL
| EXP_CASE
) && subtype
!= VSLENGTH
)
857 STPUTS_QUOTES(p
, quoted
? DQSYNTAX
: BASESYNTAX
, expdest
);
863 * Add the value of a specialized variable to the stack string.
867 varvalue(const char *name
, int quoted
, int subtype
, int flag
)
883 num
= shellparam
.nparam
;
886 num
= backgndpidval();
889 for (i
= 0 ; i
< NOPTS
; i
++) {
891 STPUTC(optlist
[i
].letter
, expdest
);
895 if (flag
& EXP_FULL
&& quoted
) {
896 for (ap
= shellparam
.p
; (p
= *ap
++) != NULL
; ) {
897 strtodest(p
, flag
, subtype
, quoted
);
899 STPUTC('\0', expdest
);
906 sep
[0] = ifsval()[0];
910 for (ap
= shellparam
.p
; (p
= *ap
++) != NULL
; ) {
911 strtodest(p
, flag
, subtype
, quoted
);
915 strtodest(sep
, flag
, subtype
, quoted
);
916 else if (flag
& EXP_FULL
&& !quoted
&& **ap
!= '\0')
917 STPUTC('\0', expdest
);
921 if (is_digit(*name
)) {
925 else if (num
> 0 && num
<= shellparam
.nparam
)
926 p
= shellparam
.p
[num
- 1];
929 strtodest(p
, flag
, subtype
, quoted
);
933 expdest
= cvtnum(num
, expdest
);
939 * Record the fact that we have to scan this region of the
940 * string for IFS characters.
944 recordregion(int start
, int end
, int inquotes
)
946 struct ifsregion
*ifsp
;
949 if (ifslastp
== NULL
) {
952 if (ifslastp
->endoff
== start
953 && ifslastp
->inquotes
== inquotes
) {
954 /* extend previous area */
955 ifslastp
->endoff
= end
;
959 ifsp
= (struct ifsregion
*)ckmalloc(sizeof (struct ifsregion
));
960 ifslastp
->next
= ifsp
;
963 ifslastp
->next
= NULL
;
964 ifslastp
->begoff
= start
;
965 ifslastp
->endoff
= end
;
966 ifslastp
->inquotes
= inquotes
;
973 * Break the argument string into pieces based upon IFS and add the
974 * strings to the argument list. The regions of the string to be
975 * searched for IFS characters have been stored by recordregion.
976 * CTLESC characters are preserved but have little effect in this pass
977 * other than escaping CTL* characters. In particular, they do not escape
978 * IFS characters: that should be done with the ifsregion mechanism.
979 * CTLQUOTEMARK characters are used to preserve empty quoted strings.
980 * This pass treats them as a regular character, making the string non-empty.
981 * Later, they are removed along with the other CTL* characters.
984 ifsbreakup(char *string
, struct arglist
*arglist
)
986 struct ifsregion
*ifsp
;
993 int had_param_ch
= 0;
997 if (ifslastp
== NULL
) {
998 /* Return entire argument, IFS doesn't apply to any of it */
999 sp
= (struct strlist
*)stalloc(sizeof *sp
);
1001 *arglist
->lastp
= sp
;
1002 arglist
->lastp
= &sp
->next
;
1006 ifs
= ifsset() ? ifsval() : " \t\n";
1008 for (ifsp
= &ifsfirst
; ifsp
!= NULL
; ifsp
= ifsp
->next
) {
1009 p
= string
+ ifsp
->begoff
;
1010 while (p
< string
+ ifsp
->endoff
) {
1014 if (ifsp
->inquotes
) {
1015 /* Only NULs (should be from "$@") end args */
1023 if (!strchr(ifs
, *p
)) {
1028 ifsspc
= strchr(" \t\n", *p
);
1030 /* Ignore IFS whitespace at start */
1031 if (q
== start
&& ifsspc
!= NULL
) {
1039 /* Save this argument... */
1041 sp
= (struct strlist
*)stalloc(sizeof *sp
);
1043 *arglist
->lastp
= sp
;
1044 arglist
->lastp
= &sp
->next
;
1047 if (ifsspc
!= NULL
) {
1048 /* Ignore further trailing IFS whitespace */
1049 for (; p
< string
+ ifsp
->endoff
; p
++) {
1053 if (strchr(ifs
, *p
) == NULL
) {
1057 if (strchr(" \t\n", *p
) == NULL
) {
1068 * Save anything left as an argument.
1069 * Traditionally we have treated 'IFS=':'; set -- x$IFS' as
1070 * generating 2 arguments, the second of which is empty.
1071 * Some recent clarification of the Posix spec say that it
1072 * should only generate one....
1074 if (had_param_ch
|| *start
!= 0) {
1075 sp
= (struct strlist
*)stalloc(sizeof *sp
);
1077 *arglist
->lastp
= sp
;
1078 arglist
->lastp
= &sp
->next
;
1083 static char expdir
[PATH_MAX
];
1084 #define expdir_end (expdir + sizeof(expdir))
1087 * Perform pathname generation and remove control characters.
1088 * At this point, the only control characters should be CTLESC and CTLQUOTEMARK.
1089 * The results are stored in the list exparg.
1092 expandmeta(struct strlist
*str
)
1095 struct strlist
**savelastp
;
1100 savelastp
= exparg
.lastp
;
1103 for (; (c
= *p
) != '\0'; p
++) {
1104 /* fast check for meta chars */
1105 if (c
== '*' || c
== '?' || c
== '[') {
1107 expmeta(expdir
, str
->text
);
1113 if (exparg
.lastp
== savelastp
) {
1117 *exparg
.lastp
= str
;
1118 rmescapes(str
->text
);
1119 exparg
.lastp
= &str
->next
;
1121 *exparg
.lastp
= NULL
;
1122 *savelastp
= sp
= expsort(*savelastp
);
1123 while (sp
->next
!= NULL
)
1125 exparg
.lastp
= &sp
->next
;
1133 * Do metacharacter (i.e. *, ?, [...]) expansion.
1137 expmeta(char *enddir
, char *name
)
1154 for (p
= name
; esc
= 0, *p
; p
+= esc
+ 1) {
1155 if (*p
== '*' || *p
== '?')
1157 else if (*p
== '[') {
1159 if (*q
== '!' || *q
== '^')
1162 while (*q
== CTLQUOTEMARK
)
1166 if (*q
== '/' || *q
== '\0')
1173 } else if (*p
== '\0')
1175 else if (*p
== CTLQUOTEMARK
)
1180 if (p
[esc
] == '/') {
1183 start
= p
+ esc
+ 1;
1187 if (metaflag
== 0) { /* we've reached the end of the file name */
1188 if (enddir
!= expdir
)
1190 for (p
= name
; ; p
++) {
1191 if (*p
== CTLQUOTEMARK
)
1198 if (enddir
== expdir_end
)
1201 if (metaflag
== 0 || lstat(expdir
, &statb
) >= 0)
1205 endname
= name
+ (p
- name
);
1206 if (start
!= name
) {
1209 while (*p
== CTLQUOTEMARK
)
1214 if (enddir
== expdir_end
)
1218 if (enddir
== expdir
) {
1220 } else if (enddir
== expdir
+ 1 && *expdir
== '/') {
1226 if ((dirp
= opendir(p
)) == NULL
)
1228 if (enddir
!= expdir
)
1230 if (*endname
== 0) {
1239 while (*p
== CTLQUOTEMARK
)
1245 while (! int_pending() && (dp
= readdir(dirp
)) != NULL
) {
1246 if (dp
->d_name
[0] == '.' && ! matchdot
)
1248 if (patmatch(start
, dp
->d_name
, 0)) {
1249 namlen
= dp
->d_namlen
;
1250 if (enddir
+ namlen
+ 1 > expdir_end
)
1252 memcpy(enddir
, dp
->d_name
, namlen
+ 1);
1256 if (dp
->d_type
!= DT_UNKNOWN
&&
1257 dp
->d_type
!= DT_DIR
&&
1258 dp
->d_type
!= DT_LNK
)
1260 if (enddir
+ namlen
+ 2 > expdir_end
)
1262 enddir
[namlen
] = '/';
1263 enddir
[namlen
+ 1] = '\0';
1264 expmeta(enddir
+ namlen
+ 1, endname
);
1270 endname
[-esc
- 1] = esc
? CTLESC
: '/';
1275 * Add a file name to the list.
1279 addfname(char *name
)
1284 p
= stsavestr(name
);
1285 sp
= (struct strlist
*)stalloc(sizeof *sp
);
1288 exparg
.lastp
= &sp
->next
;
1293 * Sort the results of file name expansion. It calculates the number of
1294 * strings to sort and then calls msort (short for merge sort) to do the
1298 static struct strlist
*
1299 expsort(struct strlist
*str
)
1305 for (sp
= str
; sp
; sp
= sp
->next
)
1307 return msort(str
, len
);
1311 static struct strlist
*
1312 msort(struct strlist
*list
, int len
)
1314 struct strlist
*p
, *q
= NULL
;
1315 struct strlist
**lpp
;
1323 for (n
= half
; --n
>= 0 ; ) {
1327 q
->next
= NULL
; /* terminate first half of list */
1328 q
= msort(list
, half
); /* sort first half of list */
1329 p
= msort(p
, len
- half
); /* sort second half */
1332 if (strcmp(p
->text
, q
->text
) < 0) {
1335 if ((p
= *lpp
) == NULL
) {
1342 if ((q
= *lpp
) == NULL
) {
1354 get_wc(const char **p
)
1359 chrlen
= mbtowc(&c
, *p
, 4);
1362 else if (chrlen
== -1)
1371 * See if a character matches a character class, starting at the first colon
1373 * If a valid character class is recognized, a pointer to the next character
1374 * after the final closing bracket is stored into *end, otherwise a null
1375 * pointer is stored into *end.
1378 match_charclass(const char *p
, wchar_t chr
, const char **end
)
1381 const char *nameend
;
1386 nameend
= strstr(p
, ":]");
1387 if (nameend
== NULL
|| (size_t)(nameend
- p
) >= sizeof(name
) ||
1390 memcpy(name
, p
, nameend
- p
);
1391 name
[nameend
- p
] = '\0';
1393 cclass
= wctype(name
);
1394 /* An unknown class matches nothing but is valid nevertheless. */
1397 return iswctype(chr
, cclass
);
1402 * Returns true if the pattern matches the string.
1406 patmatch(const char *pattern
, const char *string
, int squoted
)
1408 const char *p
, *q
, *end
;
1409 const char *bt_p
, *bt_q
;
1424 if (squoted
&& *q
== CTLESC
)
1432 if (squoted
&& *q
== CTLESC
)
1439 * A '?' does not match invalid UTF-8 but a
1440 * '*' does, so backtrack.
1445 wc
= (unsigned char)*q
++;
1449 while (c
== CTLQUOTEMARK
|| c
== '*')
1452 * If the pattern ends here, we know the string
1453 * matches without needing to look at the rest of it.
1458 * First try the shortest match for the '*' that
1459 * could work. We can forget any earlier '*' since
1460 * there is no way having it match more characters
1461 * can help us, given that we are already here.
1472 if (*endp
== '!' || *endp
== '^')
1475 while (*endp
== CTLQUOTEMARK
)
1478 goto dft
; /* no matching ] */
1479 if (*endp
== CTLESC
)
1481 } while (*++endp
!= ']');
1483 if (*p
== '!' || *p
== '^') {
1488 if (squoted
&& *q
== CTLESC
)
1497 chr
= (unsigned char)*q
++;
1500 if (c
== CTLQUOTEMARK
)
1502 if (c
== '[' && *p
== ':') {
1503 found
|= match_charclass(p
, chr
, &end
);
1509 if (localeisutf8
&& c
& 0x80) {
1512 if (wc
== 0) /* bad utf-8 */
1515 wc
= (unsigned char)c
;
1516 if (*p
== '-' && p
[1] != ']') {
1518 while (*p
== CTLQUOTEMARK
)
1524 if (wc2
== 0) /* bad utf-8 */
1527 wc2
= (unsigned char)*p
++;
1528 if ( collate_range_cmp(chr
, wc
) >= 0
1529 && collate_range_cmp(chr
, wc2
) <= 0
1536 } while ((c
= *p
++) != ']');
1537 if (found
== invert
)
1542 if (squoted
&& *q
== CTLESC
)
1550 * If we have a mismatch (other than hitting the end
1551 * of the string), go back to the last '*' seen and
1552 * have it match one additional character.
1556 if (squoted
&& *bt_q
== CTLESC
)
1571 * Remove any CTLESC and CTLQUOTEMARK characters from a string.
1575 rmescapes(char *str
)
1580 while (*p
!= CTLESC
&& *p
!= CTLQUOTEMARK
&& *p
!= CTLQUOTEEND
) {
1586 if (*p
== CTLQUOTEMARK
|| *p
== CTLQUOTEEND
) {
1600 * See if a pattern matches in a case statement.
1604 casematch(union node
*pattern
, const char *val
)
1606 struct stackmark smark
;
1610 setstackmark(&smark
);
1611 argbackq
= pattern
->narg
.backquote
;
1612 STARTSTACKSTR(expdest
);
1614 argstr(pattern
->narg
.text
, EXP_TILDE
| EXP_CASE
);
1615 STPUTC('\0', expdest
);
1616 p
= grabstackstr(expdest
);
1617 result
= patmatch(p
, val
, 0);
1618 popstackmark(&smark
);
1627 cvtnum(int num
, char *buf
)
1631 char *p
= temp
+ 31;
1636 *--p
= num
% 10 + '0';
1637 } while ((num
/= 10) != 0);
1647 * Do most of the work for wordexp(3).
1651 wordexpcmd(int argc
, char **argv
)
1656 out1fmt("%08x", argc
- 1);
1657 for (i
= 1, len
= 0; i
< argc
; i
++)
1658 len
+= strlen(argv
[i
]);
1659 out1fmt("%08x", (int)len
);
1660 for (i
= 1; i
< argc
; i
++)
1661 outbin(argv
[i
], strlen(argv
[i
]) + 1, out1
);