1 /* expand - convert tabs to spaces
2 Copyright (C) 89, 91, 1995-2005 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software Foundation,
16 Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* By default, convert all tabs to spaces.
19 Preserves backspace characters in the output; they decrement the
20 column count for tab calculations.
21 The default action is equivalent to -8.
24 --tabs=tab1[,tab2[,...]]
26 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
27 columns apart instead of the default 8. Otherwise,
28 set the tabs at columns tab1, tab2, etc. (numbered from
29 0); replace any tabs beyond the tab stops given with single spaces.
32 -i Only convert initial tabs on each line to spaces.
34 David MacKenzie <djm@gnu.ai.mit.edu> */
40 #include <sys/types.h>
46 /* The official name of this program (e.g., no `g' prefix).
   Passed, together with AUTHORS, to case_GETOPT_VERSION_CHAR in main. */
47 #define PROGRAM_NAME "expand"
/* Author credit string used alongside PROGRAM_NAME for version output. */
49 #define AUTHORS "David MacKenzie"
51 /* The number of bytes added at a time to the amount of memory
52 allocated for the output line.
   NOTE(review): OUTPUT_BLOCK is not referenced anywhere in the visible
   part of this file; confirm whether it is still needed. */
53 #define OUTPUT_BLOCK 256
55 /* The name this program was run with. */
58 /* If true, convert blanks even after nonblank characters have been read on the line. */
/* Set to true at the start of main and cleared when the -i/--initial
   option is seen; consulted by the per-character conversion logic. */
60 static bool convert_entire_line;
62 /* If nonzero, the size of all tab stops. If zero, use `tab_list' instead. */
63 static uintmax_t tab_size;
65 /* Array of the explicit column numbers of the tab stops;
66 after `tab_list' is exhausted, each additional tab is replaced
67 by a space. The first column is column 0. */
68 static uintmax_t *tab_list;
70 /* The number of allocated entries in `tab_list'. */
71 static size_t n_tabs_allocated;
73 /* The index of the first invalid element of `tab_list',
74 where the next element can be added.  Equivalently, the number of
   tab stops stored so far. */
75 static size_t first_free_tab;
77 /* Null-terminated array of input filenames.  next_file advances this
   pointer as it consumes entries. */
78 static char **file_list;
80 /* Default for `file_list' if no files are given on the command line.
   NOTE(review): the initializer lines are missing from this listing. */
81 static char *stdin_argv[] =
86 /* True if we have ever read standard input. */
87 static bool have_read_stdin;
89 /* The desired exit status. */
90 static int exit_status;
/* Short options for getopt_long: `i' takes no argument, `t' requires one,
   and each digit 0-9 takes an optional attached argument (the `::' suffix),
   which lets a whole number be written directly after the dash. */
92 static char const shortopts[] = "it:0::1::2::3::4::5::6::7::8::9::";
/* Long options: --tabs maps to `t' and --initial maps to `i'; the help and
   version entries come from the GETOPT_*_OPTION_DECL macros.
   NOTE(review): the array's braces and terminator are missing from this
   listing. */
94 static struct option const longopts[] =
96 {"tabs", required_argument, NULL, 't'},
97 {"initial", no_argument, NULL, 'i'},
98 {GETOPT_HELP_OPTION_DECL},
99 {GETOPT_VERSION_OPTION_DECL},
/* Body of the help routine (called as `usage (EXIT_FAILURE)' from main).
   When STATUS is not EXIT_SUCCESS a short "Try --help" hint is written to
   stderr.  The remaining lines are pieces of the full help text, followed by
   the standard help/version option descriptions and the bug-report address,
   all written to stdout.
   NOTE(review): the function header, the `else' branch, the printf/fputs
   calls that wrap the help text and the final exit are missing from this
   listing, so the lines below are string-literal fragments and must not be
   edited as code. */
106 if (status != EXIT_SUCCESS)
107 fprintf (stderr, _("Try `%s --help' for more information.\n"),
112 Usage: %s [OPTION]... [FILE]...\n\
116 Convert tabs in each FILE to spaces, writing to standard output.\n\
117 With no FILE, or when FILE is -, read standard input.\n\
121 Mandatory arguments to long options are mandatory for short options too.\n\
124 -i, --initial do not convert tabs after non blanks\n\
125 -t, --tabs=NUMBER have tabs NUMBER characters apart, not 8\n\
128 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
130 fputs (HELP_OPTION_DESCRIPTION, stdout);
131 fputs (VERSION_OPTION_DESCRIPTION, stdout);
132 printf (_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
137 /* Add tab stop TABVAL to the end of `tab_list'.
   When the array is full (first_free_tab == n_tabs_allocated) it is grown
   through x2nrealloc, which is given a pointer to n_tabs_allocated
   (presumably so it can record the new capacity -- confirm against the
   allocator's documentation).  The value is then stored and
   first_free_tab is advanced by one.
   NOTE(review): the return type and braces are missing from this listing. */
140 add_tab_stop (uintmax_t tabval)
142 if (first_free_tab == n_tabs_allocated)
143 tab_list = x2nrealloc (tab_list, &n_tabs_allocated, sizeof *tab_list);
144 tab_list[first_free_tab++] = tabval;
147 /* Add the comma or blank separated list of tab stops STOPS
148 to the list of tab stops.
   STOPS is scanned one character at a time.  Digits are accumulated into
   TABVAL, a separator hands the accumulated value to add_tab_stop, and any
   other character is reported as invalid.  Both diagnostics use
   error (0, 0, ...), i.e. a zero exit status argument.
   NOTE(review): several original lines are missing from this listing
   (braces, the uses of have_tabval, the start-of-number bookkeeping and
   whatever records a parse failure), so the exact conditions guarding the
   statements below cannot be confirmed from here. */
151 parse_tab_stops (char const *stops)
153 bool have_tabval = false;
/* IF_LINT supplies initializers only for lint-style builds; both variables
   are presumably assigned before use in the lines not shown -- confirm. */
154 uintmax_t tabval IF_LINT (= 0);
155 char const *num_start IF_LINT (= NULL);
158 for (; *stops; stops++)
/* A comma or blank terminates the number currently being read. */
160 if (*stops == ',' || ISBLANK (to_uchar (*stops)))
163 add_tab_stop (tabval);
166 else if (ISDIGIT (*stops))
/* Fold the digit into TABVAL; a false result signals that the value would
   exceed UINTMAX_MAX. */
175 if (!DECIMAL_DIGIT_ACCUMULATE (tabval, *stops - '0', UINTMAX_MAX))
/* Report the whole run of digits, not just the part consumed so far. */
177 size_t len = strspn (num_start, "0123456789");
178 char *bad_num = xstrndup (num_start, len);
179 error (0, 0, _("tab stop is too large %s"), quote (bad_num));
/* Skip the rest of the oversized number; the -1 compensates for the
   loop's own stops++. */
182 stops = num_start + len - 1;
/* Neither a separator nor a digit. */
187 error (0, 0, _("tab size contains invalid character(s): %s"),
/* Stores a value after the loop; presumably the final number, which has no
   trailing separator -- the guarding condition is not shown. */
198 add_tab_stop (tabval);
201 /* Check that the list of tab stops TABS, with ENTRIES entries,
202 contains only nonzero, ascending values.
   Either violation is reported through error with EXIT_FAILURE as the
   status argument.  The `<=' comparison means equal neighbouring values
   are rejected too, so the list must be strictly ascending.
   NOTE(review): the declaration of `i', the condition guarding the
   zero-size diagnostic and the update of prev_tab are missing from this
   listing. */
205 validate_tab_stops (uintmax_t const *tabs, size_t entries)
/* Value of the previously examined stop; starts at 0. */
207 uintmax_t prev_tab = 0;
210 for (i = 0; i < entries; i++)
213 error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
214 if (tabs[i] <= prev_tab)
215 error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));
220 /* Close the old stream pointer FP if it is non-NULL,
221 and return a new one opened to read the next input file.
222 Open a filename of `-' as the standard input.
223 Return NULL if there are no more input files.
   Failures are reported with error (0, errno, ...) and recorded by setting
   exit_status to EXIT_FAILURE.
   NOTE(review): the function header, the conditions that select each
   branch and the return statements are missing from this listing. */
/* Static, so it persists between calls; it is the name used in
   diagnostics about the stream being closed. */
228 static char *prev_file;
235 error (0, errno, "%s", prev_file);
236 exit_status = EXIT_FAILURE;
/* One branch only resets the stream state; the other really closes the
   stream and checks the result.  Presumably the first is for standard
   input, which main closes itself -- confirm against the missing lines. */
239 clearerr (fp); /* Also clear EOF. */
240 else if (fclose (fp) != 0)
242 error (0, errno, "%s", prev_file);
243 exit_status = EXIT_FAILURE;
/* Consume entries from the global file_list until its NULL terminator. */
247 while ((file = *file_list++) != NULL)
/* Exactly "-" names standard input. */
249 if (file[0] == '-' && file[1] == '\0')
251 have_read_stdin = true;
255 fp = fopen (file, "r");
/* Report a file by name and mark the run as failed. */
261 error (0, errno, "%s", file);
262 exit_status = EXIT_FAILURE;
267 /* Change tabs to spaces, writing to stdout.
268 Read each file in `file_list', in order.
   Input is read one character at a time with getc, moving on to the next
   file through next_file when a read returns a negative value.  For a tab,
   the column of the next tab stop is computed and the gap is filled with
   spaces.  The `convert' flag is cleared once a non-blank character is
   seen unless convert_entire_line is set.  Write failures and column
   overflow are fatal (error with EXIT_FAILURE).
   NOTE(review): the function header, most braces and several conditions
   (tab, backspace and newline tests, the loop structure) are missing from
   this listing, so the notes below describe only the visible statements. */
274 FILE *fp = next_file (NULL);
279 /* Binary I/O will preserve the original EOL style (DOS/Unix) of files. */
280 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
284 /* Input character, or EOF. */
287 /* If true, perform translations. */
/* The declarations that the two comments above describe are missing from
   this listing. */
291 /* The following variables have valid values only when CONVERT
294 /* Column of next input character. */
295 uintmax_t column = 0;
297 /* Index in TAB_LIST of next tab stop to examine. */
298 size_t tab_index = 0;
301 /* Convert a line of text. */
/* A negative getc result (EOF) advances to the next file; the loop stops
   when a character is read or next_file returns NULL.  Binary mode is
   re-applied to each newly opened stream. */
305 while ((c = getc (fp)) < 0 && (fp = next_file (fp)))
306 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
312 /* Column the next input tab stop is on. */
313 uintmax_t next_tab_column;
/* Uniform tab size: the next multiple of tab_size strictly greater than
   column. */
316 next_tab_column = column + (tab_size - column % tab_size);
/* Explicit list exhausted: the stop is the very next column, so the tab
   takes a single column. */
319 if (tab_index == first_free_tab)
321 next_tab_column = column + 1;
/* Otherwise take the next listed stop; the test that decides whether it
   is accepted is not shown. */
326 uintmax_t tab = tab_list[tab_index++];
329 next_tab_column = tab;
/* Columns are uintmax_t, so a stop below the current column indicates
   that the computation wrapped around. */
334 if (next_tab_column < column)
335 error (EXIT_FAILURE, 0, _("input line is too long"));
/* Pre-increment: this loop leaves column equal to next_tab_column and
   writes one space fewer than the gap; the last one is presumably written
   by the common output call further down -- confirm. */
337 while (++column < next_tab_column)
338 if (putchar (' ') < 0)
339 error (EXIT_FAILURE, errno, _("write error"));
/* Backspace handling: the statement after the comment below steps
   tab_index back by one unless it is already zero. */
345 /* Go back one column, and force recalculation of the
348 tab_index -= !!tab_index;
354 error (EXIT_FAILURE, 0, _("input line is too long"));
357 convert &= convert_entire_line | ISBLANK (c);
364 error (EXIT_FAILURE, errno, _("write error"));
/* Program entry point: set up locale and exit handling, parse options into
   the tab-stop list, validate it, choose between a uniform tab size and an
   explicit list, select the input files, and finally check that standard
   input closes cleanly if it was read.
   NOTE(review): the return type, local declarations (c, tab_stop), the
   switch scaffolding, the call that performs the conversion and the final
   exit are missing from this listing. */
371 main (int argc, char **argv)
375 initialize_main (&argc, &argv);
376 program_name = argv[0];
377 setlocale (LC_ALL, "");
378 bindtextdomain (PACKAGE, LOCALEDIR);
379 textdomain (PACKAGE);
/* Register close_stdout to run when the program exits. */
381 atexit (close_stdout);
/* Defaults: stdin not read yet, success status, convert every tab. */
383 have_read_stdin = false;
384 exit_status = EXIT_SUCCESS;
385 convert_entire_line = true;
389 while ((c = getopt_long (argc, argv, shortopts, longopts, NULL)) != -1)
/* -i / --initial: stop converting after the first non-blank. */
394 convert_entire_line = false;
/* -t / --tabs: the argument is the tab-stop specification. */
398 parse_tab_stops (optarg);
/* Digit options.  An optional argument must be attached to its option, so
   when optarg is set the byte just before it is the option digit itself;
   optarg - 1 therefore hands the whole number to the parser. */
401 case '0': case '1': case '2': case '3': case '4':
402 case '5': case '6': case '7': case '8': case '9':
404 parse_tab_stops (optarg - 1);
/* Presumably the no-argument case, where tab_stop is a short string built
   from the option character -- its construction is not shown. */
410 parse_tab_stops (tab_stop);
414 case_GETOPT_HELP_CHAR;
416 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
/* Presumably the default case for unrecognised options -- confirm. */
419 usage (EXIT_FAILURE);
/* All options are parsed; reject zero or non-ascending stops. */
423 validate_tab_stops (tab_list, first_free_tab);
/* No stops given: the statement for this branch is not shown (the file's
   header comment says the default is equivalent to -8).  Exactly one stop
   is treated as a uniform tab size. */
425 if (first_free_tab == 0)
427 else if (first_free_tab == 1)
428 tab_size = tab_list[0];
/* Remaining arguments are the input files; with none, fall back to
   stdin_argv. */
432 file_list = (optind < argc ? &argv[optind] : stdin_argv);
/* Close stdin only if it was actually read, and treat a failure as fatal. */
436 if (have_read_stdin && fclose (stdin) != 0)
437 error (EXIT_FAILURE, errno, "-");