global: convert indentation-TABs to spaces
[coreutils.git] / src / expand.c
blobc8648335a395455171d84424e4db7188be1a0a66
/* expand - convert tabs to spaces
   Copyright (C) 89, 91, 1995-2006, 2008-2009 Free Software Foundation, Inc.

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation, either version 3 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
/* By default, convert all tabs to spaces.
   Preserves backspace characters in the output; they decrement the
   column count for tab calculations.
   The default action is equivalent to -8.

   Options:
   --tabs=tab1[,tab2[,...]]
   -t tab1[,tab2[,...]]
   -tab1[,tab2[,...]]   If only one tab stop is given, set the tabs tab1
                        columns apart instead of the default 8.  Otherwise,
                        set the tabs at columns tab1, tab2, etc. (numbered from
                        0); replace any tabs beyond the tab stops given with
                        single spaces.
   --initial
   -i                   Only convert initial tabs on each line to spaces.

   David MacKenzie <djm@gnu.ai.mit.edu> */
35 #include <config.h>
37 #include <stdio.h>
38 #include <getopt.h>
39 #include <sys/types.h>
40 #include "system.h"
41 #include "error.h"
42 #include "quote.h"
43 #include "xstrndup.h"
45 /* The official name of this program (e.g., no `g' prefix). */
46 #define PROGRAM_NAME "expand"
48 #define AUTHORS proper_name ("David MacKenzie")
50 /* If true, convert blanks even after nonblank characters have been
51 read on the line. */
52 static bool convert_entire_line;
54 /* If nonzero, the size of all tab stops. If zero, use `tab_list' instead. */
55 static uintmax_t tab_size;
57 /* Array of the explicit column numbers of the tab stops;
58 after `tab_list' is exhausted, each additional tab is replaced
59 by a space. The first column is column 0. */
60 static uintmax_t *tab_list;
62 /* The number of allocated entries in `tab_list'. */
63 static size_t n_tabs_allocated;
65 /* The index of the first invalid element of `tab_list',
66 where the next element can be added. */
67 static size_t first_free_tab;
69 /* Null-terminated array of input filenames. */
70 static char **file_list;
72 /* Default for `file_list' if no files are given on the command line. */
73 static char *stdin_argv[] =
75 (char *) "-", NULL
78 /* True if we have ever read standard input. */
79 static bool have_read_stdin;
81 /* The desired exit status. */
82 static int exit_status;
84 static char const shortopts[] = "it:0::1::2::3::4::5::6::7::8::9::";
86 static struct option const longopts[] =
88 {"tabs", required_argument, NULL, 't'},
89 {"initial", no_argument, NULL, 'i'},
90 {GETOPT_HELP_OPTION_DECL},
91 {GETOPT_VERSION_OPTION_DECL},
92 {NULL, 0, NULL, 0}
95 void
96 usage (int status)
98 if (status != EXIT_SUCCESS)
99 fprintf (stderr, _("Try `%s --help' for more information.\n"),
100 program_name);
101 else
103 printf (_("\
104 Usage: %s [OPTION]... [FILE]...\n\
106 program_name);
107 fputs (_("\
108 Convert tabs in each FILE to spaces, writing to standard output.\n\
109 With no FILE, or when FILE is -, read standard input.\n\
111 "), stdout);
112 fputs (_("\
113 Mandatory arguments to long options are mandatory for short options too.\n\
114 "), stdout);
115 fputs (_("\
116 -i, --initial do not convert tabs after non blanks\n\
117 -t, --tabs=NUMBER have tabs NUMBER characters apart, not 8\n\
118 "), stdout);
119 fputs (_("\
120 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
121 "), stdout);
122 fputs (HELP_OPTION_DESCRIPTION, stdout);
123 fputs (VERSION_OPTION_DESCRIPTION, stdout);
124 emit_bug_reporting_address ();
126 exit (status);
129 /* Add tab stop TABVAL to the end of `tab_list'. */
131 static void
132 add_tab_stop (uintmax_t tabval)
134 if (first_free_tab == n_tabs_allocated)
135 tab_list = X2NREALLOC (tab_list, &n_tabs_allocated);
136 tab_list[first_free_tab++] = tabval;
139 /* Add the comma or blank separated list of tab stops STOPS
140 to the list of tab stops. */
142 static void
143 parse_tab_stops (char const *stops)
145 bool have_tabval = false;
146 uintmax_t tabval IF_LINT (= 0);
147 char const *num_start IF_LINT (= NULL);
148 bool ok = true;
150 for (; *stops; stops++)
152 if (*stops == ',' || isblank (to_uchar (*stops)))
154 if (have_tabval)
155 add_tab_stop (tabval);
156 have_tabval = false;
158 else if (ISDIGIT (*stops))
160 if (!have_tabval)
162 tabval = 0;
163 have_tabval = true;
164 num_start = stops;
167 /* Detect overflow. */
168 if (!DECIMAL_DIGIT_ACCUMULATE (tabval, *stops - '0', uintmax_t))
170 size_t len = strspn (num_start, "0123456789");
171 char *bad_num = xstrndup (num_start, len);
172 error (0, 0, _("tab stop is too large %s"), quote (bad_num));
173 free (bad_num);
174 ok = false;
175 stops = num_start + len - 1;
178 else
180 error (0, 0, _("tab size contains invalid character(s): %s"),
181 quote (stops));
182 ok = false;
183 break;
187 if (!ok)
188 exit (EXIT_FAILURE);
190 if (have_tabval)
191 add_tab_stop (tabval);
/* Verify that the ENTRIES tab stops in TABS are all nonzero and
   strictly increasing.  The first violation found is reported with
   error () using EXIT_FAILURE as its status.  */

static void
validate_tab_stops (uintmax_t const *tabs, size_t entries)
{
  uintmax_t previous = 0;
  size_t idx = 0;

  while (idx < entries)
    {
      uintmax_t stop = tabs[idx++];

      if (stop == 0)
        error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (stop <= previous)
        error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));

      previous = stop;
    }
}
213 /* Close the old stream pointer FP if it is non-NULL,
214 and return a new one opened to read the next input file.
215 Open a filename of `-' as the standard input.
216 Return NULL if there are no more input files. */
218 static FILE *
219 next_file (FILE *fp)
221 static char *prev_file;
222 char *file;
224 if (fp)
226 if (ferror (fp))
228 error (0, errno, "%s", prev_file);
229 exit_status = EXIT_FAILURE;
231 if (STREQ (prev_file, "-"))
232 clearerr (fp); /* Also clear EOF. */
233 else if (fclose (fp) != 0)
235 error (0, errno, "%s", prev_file);
236 exit_status = EXIT_FAILURE;
240 while ((file = *file_list++) != NULL)
242 if (STREQ (file, "-"))
244 have_read_stdin = true;
245 prev_file = file;
246 return stdin;
248 fp = fopen (file, "r");
249 if (fp)
251 prev_file = file;
252 return fp;
254 error (0, errno, "%s", file);
255 exit_status = EXIT_FAILURE;
257 return NULL;
260 /* Change tabs to spaces, writing to stdout.
261 Read each file in `file_list', in order. */
263 static void
264 expand (void)
266 /* Input stream. */
267 FILE *fp = next_file (NULL);
269 if (!fp)
270 return;
272 for (;;)
274 /* Input character, or EOF. */
275 int c;
277 /* If true, perform translations. */
278 bool convert = true;
281 /* The following variables have valid values only when CONVERT
282 is true: */
284 /* Column of next input character. */
285 uintmax_t column = 0;
287 /* Index in TAB_LIST of next tab stop to examine. */
288 size_t tab_index = 0;
291 /* Convert a line of text. */
295 while ((c = getc (fp)) < 0 && (fp = next_file (fp)))
296 continue;
298 if (convert)
300 if (c == '\t')
302 /* Column the next input tab stop is on. */
303 uintmax_t next_tab_column;
305 if (tab_size)
306 next_tab_column = column + (tab_size - column % tab_size);
307 else
308 for (;;)
309 if (tab_index == first_free_tab)
311 next_tab_column = column + 1;
312 break;
314 else
316 uintmax_t tab = tab_list[tab_index++];
317 if (column < tab)
319 next_tab_column = tab;
320 break;
324 if (next_tab_column < column)
325 error (EXIT_FAILURE, 0, _("input line is too long"));
327 while (++column < next_tab_column)
328 if (putchar (' ') < 0)
329 error (EXIT_FAILURE, errno, _("write error"));
331 c = ' ';
333 else if (c == '\b')
335 /* Go back one column, and force recalculation of the
336 next tab stop. */
337 column -= !!column;
338 tab_index -= !!tab_index;
340 else
342 column++;
343 if (!column)
344 error (EXIT_FAILURE, 0, _("input line is too long"));
347 convert &= convert_entire_line | !! isblank (c);
350 if (c < 0)
351 return;
353 if (putchar (c) < 0)
354 error (EXIT_FAILURE, errno, _("write error"));
356 while (c != '\n');
361 main (int argc, char **argv)
363 int c;
365 initialize_main (&argc, &argv);
366 set_program_name (argv[0]);
367 setlocale (LC_ALL, "");
368 bindtextdomain (PACKAGE, LOCALEDIR);
369 textdomain (PACKAGE);
371 atexit (close_stdout);
373 have_read_stdin = false;
374 exit_status = EXIT_SUCCESS;
375 convert_entire_line = true;
376 tab_list = NULL;
377 first_free_tab = 0;
379 while ((c = getopt_long (argc, argv, shortopts, longopts, NULL)) != -1)
381 switch (c)
383 case 'i':
384 convert_entire_line = false;
385 break;
387 case 't':
388 parse_tab_stops (optarg);
389 break;
391 case '0': case '1': case '2': case '3': case '4':
392 case '5': case '6': case '7': case '8': case '9':
393 if (optarg)
394 parse_tab_stops (optarg - 1);
395 else
397 char tab_stop[2];
398 tab_stop[0] = c;
399 tab_stop[1] = '\0';
400 parse_tab_stops (tab_stop);
402 break;
404 case_GETOPT_HELP_CHAR;
406 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
408 default:
409 usage (EXIT_FAILURE);
413 validate_tab_stops (tab_list, first_free_tab);
415 if (first_free_tab == 0)
416 tab_size = 8;
417 else if (first_free_tab == 1)
418 tab_size = tab_list[0];
419 else
420 tab_size = 0;
422 file_list = (optind < argc ? &argv[optind] : stdin_argv);
424 expand ();
426 if (have_read_stdin && fclose (stdin) != 0)
427 error (EXIT_FAILURE, errno, "-");
429 exit (exit_status);