586 sed -i should take an "optional" argument
[illumos-gate.git] / usr / src / cmd / sed / main.c
blob 93e14bb09b6d4a1725b956209bef7e2df11db715
1 /*
2 * Copyright (c) 2011 Gary Mills
3 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
4 * Copyright (c) 1992 Diomidis Spinellis.
5 * Copyright (c) 1992, 1993
6 * The Regents of the University of California. All rights reserved.
8 * This code is derived from software contributed to Berkeley by
9 * Diomidis Spinellis of Imperial College, University of London.
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 4. Neither the name of the University nor the names of its contributors
20 * may be used to endorse or promote products derived from this software
21 * without specific prior written permission.
23 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * SUCH DAMAGE.
36 #include <sys/types.h>
37 #include <sys/mman.h>
38 #include <sys/param.h>
39 #include <sys/stat.h>
41 #include <err.h>
42 #include <errno.h>
43 #include <fcntl.h>
44 #include <getopt.h>
45 #include <libgen.h>
46 #include <libintl.h>
47 #include <limits.h>
48 #include <locale.h>
49 #include <regex.h>
50 #include <stddef.h>
51 #include <stdio.h>
52 #include <stdlib.h>
53 #include <string.h>
54 #include <unistd.h>
56 #include "defs.h"
57 #include "extern.h"
/*
 * Kind of compilation unit: a file holding script text, or the script
 * text itself.
 */
enum e_cut {CU_FILE, CU_STRING};

/*
 * Linked list of units (strings and files) to be compiled
 */
struct s_compunit {
	struct s_compunit *next;	/* Following unit, NULL at the tail */
	enum e_cut type;		/* How the s member is interpreted */
	char *s;			/* Pointer to string or fname */
};
/*
 * Linked list pointer to compilation units and pointer to current
 * next pointer.
 */
static struct s_compunit *script;		/* Head of the list */
static struct s_compunit **cu_nextp = &script;	/* Where to link the next */
/*
 * Linked list of files to be processed
 */
struct s_flist {
	char *fname;		/* File name; add_file(NULL) is used for stdin */
	struct s_flist *next;	/* Following entry, NULL at the tail */
};
/*
 * Linked list pointer to files and pointer to current
 * next pointer.
 */
static struct s_flist *files;			/* Head of the list */
static struct s_flist **fl_nextp = &files;	/* Where to link the next */
88 FILE *infile; /* Current input file */
89 FILE *outfile; /* Current output file */
91 int aflag, eflag, nflag;
92 int rflags = 0;
93 static int rval; /* Exit status */
95 static int ispan; /* Whether inplace editing spans across files */
98 * Current file and line number; line numbers restart across compilation
99 * units, but span across input files. The latter is optional if editing
100 * in place.
102 const char *fname; /* File name. */
103 const char *outfname; /* Output file name */
104 static char oldfname[PATH_MAX]; /* Old file name (for in-place editing) */
105 static char tmpfname[PATH_MAX]; /* Temporary file name (for in-place editing) */
106 static const char *inplace; /* Inplace edit file extension. */
107 ulong_t linenum;
/*
 * Long options accepted by getopt_long(); --in-place maps onto -i and,
 * like it, takes an optional argument.
 */
static const struct option lopts[] = {
	{
		.name = "in-place",
		.has_arg = optional_argument,
		.flag = NULL,
		.val = 'i'
	},
	{NULL, 0, NULL, 0}	/* terminator */
};
/* Helpers private to this file. */
static void add_compunit(enum e_cut type, char *s);
static void add_file(char *s);
static void usage(void);
static char *getln(FILE *in, size_t *lenp);
121 main(int argc, char *argv[])
123 int c, fflag;
124 char *temp_arg;
126 (void) setlocale(LC_ALL, "");
128 #ifndef TEXT_DOMAIN
129 #define TEXT_DOMAIN "SYS_TEST"
130 #endif
131 (void) textdomain(TEXT_DOMAIN);
133 fflag = 0;
134 inplace = NULL;
136 while ((c = getopt_long(argc, argv, "EI::ae:f:i::lnr", lopts, NULL)) !=
138 switch (c) {
139 case 'r': /* Gnu sed compat */
140 case 'E':
141 rflags = REG_EXTENDED;
142 break;
143 case 'I':
144 if (optarg != NULL)
145 inplace = optarg;
146 else
147 inplace = "";
148 ispan = 1; /* span across input files */
149 break;
150 case 'a':
151 aflag = 1;
152 break;
153 case 'e':
154 eflag = 1;
155 if (asprintf(&temp_arg, "%s\n", optarg) < 1)
156 err(1, "asprintf");
157 add_compunit(CU_STRING, temp_arg);
158 break;
159 case 'f':
160 fflag = 1;
161 add_compunit(CU_FILE, optarg);
162 break;
163 case 'i':
164 if (optarg != NULL)
165 inplace = optarg;
166 else
167 inplace = "";
168 ispan = 0; /* don't span across input files */
169 break;
170 case 'l':
171 /* On SunOS, setlinebuf "returns no useful value */
172 (void) setlinebuf(stdout);
173 break;
174 case 'n':
175 nflag = 1;
176 break;
177 default:
178 case '?':
179 usage();
181 argc -= optind;
182 argv += optind;
184 /* First usage case; script is the first arg */
185 if (!eflag && !fflag && *argv) {
186 add_compunit(CU_STRING, *argv);
187 argv++;
190 compile();
192 /* Continue with first and start second usage */
193 if (*argv)
194 for (; *argv; argv++)
195 add_file(*argv);
196 else
197 add_file(NULL);
198 process();
199 cfclose(prog, NULL);
200 if (fclose(stdout))
201 err(1, "stdout");
202 return (rval);
/*
 * Write the command synopsis to stderr and exit with status 1.
 */
static void
usage(void)
{
	const char *synopsis;

	/* The whole text is one message so it is looked up as a unit. */
	synopsis = _("usage: sed script [-Ealn] [-i[extension]] [file...]\n"
	    " sed [-Ealn] [-i[extension]] [-e script]... "
	    "[-f script_file]... [file...]\n");
	(void) fputs(synopsis, stderr);
	exit(1);
}
216 * Like fgets, but go through the chain of compilation units chaining them
217 * together. Empty strings and files are ignored.
219 char *
220 cu_fgets(char *buf, int n, int *more)
222 static enum {ST_EOF, ST_FILE, ST_STRING} state = ST_EOF;
223 static FILE *f; /* Current open file */
224 static char *s; /* Current pointer inside string */
225 static char string_ident[30];
226 char *p;
228 again:
229 switch (state) {
230 case ST_EOF:
231 if (script == NULL) {
232 if (more != NULL)
233 *more = 0;
234 return (NULL);
236 linenum = 0;
237 switch (script->type) {
238 case CU_FILE:
239 if ((f = fopen(script->s, "r")) == NULL)
240 err(1, "%s", script->s);
241 fname = script->s;
242 state = ST_FILE;
243 goto again;
244 case CU_STRING:
245 if (((size_t)snprintf(string_ident,
246 sizeof (string_ident), "\"%s\"", script->s)) >=
247 sizeof (string_ident) - 1)
248 (void) strcpy(string_ident +
249 sizeof (string_ident) - 6, " ...\"");
250 fname = string_ident;
251 s = script->s;
252 state = ST_STRING;
253 goto again;
255 /*NOTREACHED*/
257 case ST_FILE:
258 if ((p = fgets(buf, n, f)) != NULL) {
259 linenum++;
260 if (linenum == 1 && buf[0] == '#' && buf[1] == 'n')
261 nflag = 1;
262 if (more != NULL)
263 *more = !feof(f);
264 return (p);
266 script = script->next;
267 (void) fclose(f);
268 state = ST_EOF;
269 goto again;
270 case ST_STRING:
271 if (linenum == 0 && s[0] == '#' && s[1] == 'n')
272 nflag = 1;
273 p = buf;
274 for (;;) {
275 if (n-- <= 1) {
276 *p = '\0';
277 linenum++;
278 if (more != NULL)
279 *more = 1;
280 return (buf);
282 switch (*s) {
283 case '\0':
284 state = ST_EOF;
285 if (s == script->s) {
286 script = script->next;
287 goto again;
288 } else {
289 script = script->next;
290 *p = '\0';
291 linenum++;
292 if (more != NULL)
293 *more = 0;
294 return (buf);
296 case '\n':
297 *p++ = '\n';
298 *p = '\0';
299 s++;
300 linenum++;
301 if (more != NULL)
302 *more = 0;
303 return (buf);
304 default:
305 *p++ = *s++;
309 /* NOTREACHED */
310 return (NULL);
314 * Like fgets, but go through the list of files chaining them together.
315 * Set len to the length of the line.
318 mf_fgets(SPACE *sp, enum e_spflag spflag)
320 struct stat sb, nsb;
321 size_t len;
322 char *p;
323 int c;
324 static int firstfile;
326 if (infile == NULL) {
327 /* stdin? */
328 if (files->fname == NULL) {
329 if (inplace != NULL)
330 errx(1,
331 _("-I or -i may not be used with stdin"));
332 infile = stdin;
333 fname = "stdin";
334 outfile = stdout;
335 outfname = "stdout";
337 firstfile = 1;
340 for (;;) {
341 if (infile != NULL && (c = getc(infile)) != EOF) {
342 (void) ungetc(c, infile);
343 break;
345 /* If we are here then either eof or no files are open yet */
346 if (infile == stdin) {
347 sp->len = 0;
348 return (0);
350 if (infile != NULL) {
351 (void) fclose(infile);
352 if (*oldfname != '\0') {
353 /* if there was a backup file, remove it */
354 (void) unlink(oldfname);
356 * Backup the original. Note that hard links
357 * are not supported on all filesystems.
359 if ((link(fname, oldfname) != 0) &&
360 (rename(fname, oldfname) != 0)) {
361 warn("rename()");
362 if (*tmpfname)
363 (void) unlink(tmpfname);
364 exit(1);
366 *oldfname = '\0';
368 if (*tmpfname != '\0') {
369 if (outfile != NULL && outfile != stdout)
370 if (fclose(outfile) != 0) {
371 warn("fclose()");
372 (void) unlink(tmpfname);
373 exit(1);
375 outfile = NULL;
376 if (rename(tmpfname, fname) != 0) {
377 /* this should not happen really! */
378 warn("rename()");
379 (void) unlink(tmpfname);
380 exit(1);
382 *tmpfname = '\0';
384 outfname = NULL;
386 if (firstfile == 0)
387 files = files->next;
388 else
389 firstfile = 0;
390 if (files == NULL) {
391 sp->len = 0;
392 return (0);
394 fname = files->fname;
395 if (inplace != NULL) {
396 char bn[PATH_MAX];
397 char dn[PATH_MAX];
398 (void) strlcpy(bn, fname, sizeof (bn));
399 (void) strlcpy(dn, fname, sizeof (dn));
400 if (lstat(fname, &sb) != 0)
401 err(1, "%s", fname);
402 if (!(sb.st_mode & S_IFREG))
403 fatal(_("in-place editing only "
404 "works for regular files"));
405 if (*inplace != '\0') {
406 (void) strlcpy(oldfname, fname,
407 sizeof (oldfname));
408 len = strlcat(oldfname, inplace,
409 sizeof (oldfname));
410 if (len > sizeof (oldfname))
411 fatal(_("name too long"));
413 len = snprintf(tmpfname, sizeof (tmpfname),
414 "%s/.!%ld!%s", dirname(dn), (long)getpid(),
415 basename(bn));
416 if (len >= sizeof (tmpfname))
417 fatal(_("name too long"));
418 (void) unlink(tmpfname);
419 if ((outfile = fopen(tmpfname, "w")) == NULL)
420 err(1, "%s", fname);
422 * Some file systems don't support chown or
423 * chmod fully. On those, the owner/group and
424 * permissions will already be set to what
425 * they need to be.
427 if (fstat(fileno(outfile), &nsb) != 0) {
428 warn("fstat()");
430 if (((sb.st_uid != nsb.st_uid) ||
431 (sb.st_gid != nsb.st_gid)) &&
432 (fchown(fileno(outfile), sb.st_uid, sb.st_gid)
433 != 0))
434 warn("fchown()");
435 if ((sb.st_mode != nsb.st_mode) &&
436 (fchmod(fileno(outfile), sb.st_mode & 07777) != 0))
437 warn("fchmod()");
438 outfname = tmpfname;
439 if (!ispan) {
440 linenum = 0;
441 resetstate();
443 } else {
444 outfile = stdout;
445 outfname = "stdout";
447 if ((infile = fopen(fname, "r")) == NULL) {
448 warn("%s", fname);
449 rval = 1;
450 continue;
454 * We are here only when infile is open and we still have something
455 * to read from it.
457 * Use fgetln so that we can handle essentially infinite input data.
458 * Can't use the pointer into the stdio buffer as the process space
459 * because the ungetc() can cause it to move.
461 p = getln(infile, &len);
462 if (ferror(infile))
463 errx(1, "%s: %s", fname, strerror(errno ? errno : EIO));
464 if (len != 0 && p[len - 1] == '\n')
465 len--;
466 cspace(sp, p, len, spflag);
468 linenum++;
470 return (1);
474 * Add a compilation unit to the linked list
476 static void
477 add_compunit(enum e_cut type, char *s)
479 struct s_compunit *cu;
481 if ((cu = malloc(sizeof (struct s_compunit))) == NULL)
482 err(1, "malloc");
483 cu->type = type;
484 cu->s = s;
485 cu->next = NULL;
486 *cu_nextp = cu;
487 cu_nextp = &cu->next;
491 * Add a file to the linked list
493 static void
494 add_file(char *s)
496 struct s_flist *fp;
498 if ((fp = malloc(sizeof (struct s_flist))) == NULL)
499 err(1, "malloc");
500 fp->next = NULL;
501 *fl_nextp = fp;
502 fp->fname = s;
503 fl_nextp = &fp->next;
507 lastline(void)
509 int ch;
511 if (files->next != NULL && (inplace == NULL || ispan))
512 return (0);
513 if ((ch = getc(infile)) == EOF)
514 return (1);
515 (void) ungetc(ch, infile);
516 return (0);
/*
 * Read the next line of arbitrary length from in.
 *
 * The line, including its trailing newline when one was read, is stored
 * in a buffer that is shared by all calls: it is grown in LINE_MAX steps
 * as needed and overwritten by the next call, so callers must copy what
 * they want to keep.  *lenp receives the number of characters stored; it
 * is 0 when nothing could be read (end of file or a read error).
 * Running out of memory terminates the program through err().
 *
 * The length is measured with strlen(), so a NUL byte in the input hides
 * the rest of the chunk it was read with.
 */
char *
getln(FILE *in, size_t *lenp)
{
	static char *buffer = NULL;
	static size_t sz = 0;

	size_t len = 0;

	for (;;) {
		size_t room;

		if (sz <= (len + 1)) {
			char *nb;
			if ((nb = realloc(buffer, sz + LINE_MAX)) == NULL) {
				err(1, "realloc");
			}
			buffer = nb;
			sz += LINE_MAX;
		}

		buffer[len] = 0;

		/* fgets() takes an int; never hand it a wrapped size. */
		room = sz - len;
		if (room > (size_t)INT_MAX)
			room = (size_t)INT_MAX;

		if (fgets(buffer + len, (int)room, in) == NULL) {
			/* END OF FILE */
			*lenp = len;
			break;
		}

		len += strlen(buffer + len);

		/*
		 * len is still 0 when the chunk just read starts with a NUL
		 * byte; looking at buffer[len - 1] would then read in front
		 * of the allocation.
		 */
		if (len > 0 && buffer[len - 1] == '\n') {
			/* got the new line */
			*lenp = len;
			break;
		}
	}

	return (buffer);
}