Clean up after the change of 2006-12-28.
[coreutils.git] / src / expand.c
blob564520376319c86e1416bd8cc54a31e4e57f1e64
1 /* expand - convert tabs to spaces
2 Copyright (C) 89, 91, 1995-2006 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software Foundation,
16 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
18 /* By default, convert all tabs to spaces.
19 Preserves backspace characters in the output; they decrement the
20 column count for tab calculations.
21 The default action is equivalent to -8.
23 Options:
24 --tabs=tab1[,tab2[,...]]
25 -t tab1[,tab2[,...]]
26 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
27 columns apart instead of the default 8. Otherwise,
28 set the tabs at columns tab1, tab2, etc. (numbered from
29 0); replace any tabs beyond the tab stops given with
30 single spaces.
31 --initial
32 -i Only convert initial tabs on each line to spaces.
34 David MacKenzie <djm@gnu.ai.mit.edu> */
36 #include <config.h>
38 #include <stdio.h>
39 #include <getopt.h>
40 #include <sys/types.h>
41 #include "system.h"
42 #include "error.h"
43 #include "quote.h"
44 #include "xstrndup.h"
46 /* The official name of this program (e.g., no `g' prefix). */
47 #define PROGRAM_NAME "expand"
/* Author credit.  main passes this, together with PROGRAM_NAME, to
   case_GETOPT_VERSION_CHAR. */
49 #define AUTHORS "David MacKenzie"
51 /* The number of bytes added at a time to the amount of memory
52 allocated for the output line. */
/* NOTE(review): no reference to OUTPUT_BLOCK is visible in this file;
   it looks like a leftover -- confirm before removing. */
53 #define OUTPUT_BLOCK 256
55 /* The name this program was run with. */
/* Set from argv[0] in main; printed by usage. */
56 char *program_name;
58 /* If true, convert blanks even after nonblank characters have been
59 read on the line. */
/* main initializes this to true; the 'i' (--initial) option clears it. */
60 static bool convert_entire_line;
62 /* If nonzero, the size of all tab stops. If zero, use `tab_list' instead. */
/* main sets this after option parsing: 8 when no stop was given, the
   single stop when exactly one was given, otherwise 0. */
63 static uintmax_t tab_size;
65 /* Array of the explicit column numbers of the tab stops;
66 after `tab_list' is exhausted, each additional tab is replaced
67 by a space. The first column is column 0. */
/* Filled by add_tab_stop and checked by validate_tab_stops. */
68 static uintmax_t *tab_list;
70 /* The number of allocated entries in `tab_list'. */
/* Updated through X2NREALLOC in add_tab_stop. */
71 static size_t n_tabs_allocated;
73 /* The index of the first invalid element of `tab_list',
74 where the next element can be added. */
/* Doubles as the count of stored tab stops: main and expand compare
   against it to know how many entries of `tab_list' are usable. */
75 static size_t first_free_tab;
77 /* Null-terminated array of input filenames. */
/* next_file advances this pointer past each name it consumes. */
78 static char **file_list;
80 /* Default for `file_list' if no files are given on the command line. */
81 static char *stdin_argv[] =
83 "-", NULL
86 /* True if we have ever read standard input. */
/* Set by next_file when it hands out stdin; main uses it to decide
   whether stdin must be closed (and the close checked) before exit. */
87 static bool have_read_stdin;
89 /* The desired exit status. */
/* Starts as EXIT_SUCCESS in main; next_file changes it to EXIT_FAILURE
   when a file cannot be opened, read, or closed. */
90 static int exit_status;
/* Short option string handed to getopt_long in main: `i' takes no
   argument, `t' requires one, and every digit is declared with `::'.
   main checks optarg for the digit options: when it is set, the digit
   immediately preceding it is included by passing `optarg - 1' to
   parse_tab_stops; otherwise the lone digit is parsed by itself. */
92 static char const shortopts[] = "it:0::1::2::3::4::5::6::7::8::9::";
/* Long options; each maps onto the short option letter handled in
   main's switch.  The table ends with an all-zero entry. */
94 static struct option const longopts[] =
96 {"tabs", required_argument, NULL, 't'},
97 {"initial", no_argument, NULL, 'i'},
98 {GETOPT_HELP_OPTION_DECL},
99 {GETOPT_VERSION_OPTION_DECL},
100 {NULL, 0, NULL, 0}
/* Print usage information and terminate the program with STATUS.
   When STATUS is not EXIT_SUCCESS, only a one-line hint pointing at
   `--help' is written to stderr; otherwise the full help text and the
   bug-report address are written to stdout.  Either way the function
   ends by calling exit (STATUS). */
103 void
104 usage (int status)
/* Failure path: short hint only. */
106 if (status != EXIT_SUCCESS)
107 fprintf (stderr, _("Try `%s --help' for more information.\n"),
108 program_name);
109 else
111 printf (_("\
112 Usage: %s [OPTION]... [FILE]...\n\
114 program_name);
115 fputs (_("\
116 Convert tabs in each FILE to spaces, writing to standard output.\n\
117 With no FILE, or when FILE is -, read standard input.\n\
119 "), stdout);
120 fputs (_("\
121 Mandatory arguments to long options are mandatory for short options too.\n\
122 "), stdout);
123 fputs (_("\
124 -i, --initial do not convert tabs after non blanks\n\
125 -t, --tabs=NUMBER have tabs NUMBER characters apart, not 8\n\
126 "), stdout);
127 fputs (_("\
128 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
129 "), stdout);
130 fputs (HELP_OPTION_DESCRIPTION, stdout);
131 fputs (VERSION_OPTION_DESCRIPTION, stdout);
132 printf (_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
134 exit (status);
137 /* Add tab stop TABVAL to the end of `tab_list'. */
139 static void
140 add_tab_stop (uintmax_t tabval)
142 if (first_free_tab == n_tabs_allocated)
143 tab_list = X2NREALLOC (tab_list, &n_tabs_allocated);
144 tab_list[first_free_tab++] = tabval;
147 /* Add the comma or blank separated list of tab stops STOPS
148 to the list of tab stops. */
150 static void
151 parse_tab_stops (char const *stops)
153 bool have_tabval = false;
154 uintmax_t tabval IF_LINT (= 0);
155 char const *num_start IF_LINT (= NULL);
156 bool ok = true;
158 for (; *stops; stops++)
160 if (*stops == ',' || isblank (to_uchar (*stops)))
162 if (have_tabval)
163 add_tab_stop (tabval);
164 have_tabval = false;
166 else if (ISDIGIT (*stops))
168 if (!have_tabval)
170 tabval = 0;
171 have_tabval = true;
172 num_start = stops;
175 /* Detect overflow. */
176 if (!DECIMAL_DIGIT_ACCUMULATE (tabval, *stops - '0', uintmax_t))
178 size_t len = strspn (num_start, "0123456789");
179 char *bad_num = xstrndup (num_start, len);
180 error (0, 0, _("tab stop is too large %s"), quote (bad_num));
181 free (bad_num);
182 ok = false;
183 stops = num_start + len - 1;
186 else
188 error (0, 0, _("tab size contains invalid character(s): %s"),
189 quote (stops));
190 ok = false;
191 break;
195 if (!ok)
196 exit (EXIT_FAILURE);
198 if (have_tabval)
199 add_tab_stop (tabval);
/* Verify that the ENTRIES tab stops stored in TABS are all nonzero and
   strictly increasing.  The first violation found is reported through
   error with EXIT_FAILURE as its status.  With ENTRIES equal to 0,
   TABS is never dereferenced. */

static void
validate_tab_stops (uintmax_t const *tabs, size_t entries)
{
  uintmax_t last_stop = 0;
  size_t idx = 0;

  while (idx != entries)
    {
      uintmax_t const stop = tabs[idx++];

      if (stop == 0)
        error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (stop <= last_stop)
        error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));

      last_stop = stop;
    }
}
221 /* Close the old stream pointer FP if it is non-NULL,
222 and return a new one opened to read the next input file.
223 Open a filename of `-' as the standard input.
224 Return NULL if there are no more input files. */
226 static FILE *
227 next_file (FILE *fp)
229 static char *prev_file;
230 char *file;
232 if (fp)
234 if (ferror (fp))
236 error (0, errno, "%s", prev_file);
237 exit_status = EXIT_FAILURE;
239 if (STREQ (prev_file, "-"))
240 clearerr (fp); /* Also clear EOF. */
241 else if (fclose (fp) != 0)
243 error (0, errno, "%s", prev_file);
244 exit_status = EXIT_FAILURE;
248 while ((file = *file_list++) != NULL)
250 if (STREQ (file, "-"))
252 have_read_stdin = true;
253 prev_file = file;
254 return stdin;
256 fp = fopen (file, "r");
257 if (fp)
259 prev_file = file;
260 return fp;
262 error (0, errno, "%s", file);
263 exit_status = EXIT_FAILURE;
265 return NULL;
268 /* Change tabs to spaces, writing to stdout.
269 Read each file in `file_list', in order. */
271 static void
272 expand (void)
274 /* Input stream. */
275 FILE *fp = next_file (NULL);
277 if (!fp)
278 return;
280 for (;;)
282 /* Input character, or EOF. */
283 int c;
285 /* If true, perform translations. */
286 bool convert = true;
289 /* The following variables have valid values only when CONVERT
290 is true: */
292 /* Column of next input character. */
293 uintmax_t column = 0;
295 /* Index in TAB_LIST of next tab stop to examine. */
296 size_t tab_index = 0;
299 /* Convert a line of text. */
303 while ((c = getc (fp)) < 0 && (fp = next_file (fp)))
304 continue;
306 if (convert)
308 if (c == '\t')
310 /* Column the next input tab stop is on. */
311 uintmax_t next_tab_column;
313 if (tab_size)
314 next_tab_column = column + (tab_size - column % tab_size);
315 else
316 for (;;)
317 if (tab_index == first_free_tab)
319 next_tab_column = column + 1;
320 break;
322 else
324 uintmax_t tab = tab_list[tab_index++];
325 if (column < tab)
327 next_tab_column = tab;
328 break;
332 if (next_tab_column < column)
333 error (EXIT_FAILURE, 0, _("input line is too long"));
335 while (++column < next_tab_column)
336 if (putchar (' ') < 0)
337 error (EXIT_FAILURE, errno, _("write error"));
339 c = ' ';
341 else if (c == '\b')
343 /* Go back one column, and force recalculation of the
344 next tab stop. */
345 column -= !!column;
346 tab_index -= !!tab_index;
348 else
350 column++;
351 if (!column)
352 error (EXIT_FAILURE, 0, _("input line is too long"));
355 convert &= convert_entire_line | !! isblank (c);
358 if (c < 0)
359 return;
361 if (putchar (c) < 0)
362 error (EXIT_FAILURE, errno, _("write error"));
364 while (c != '\n');
369 main (int argc, char **argv)
371 int c;
373 initialize_main (&argc, &argv);
374 program_name = argv[0];
375 setlocale (LC_ALL, "");
376 bindtextdomain (PACKAGE, LOCALEDIR);
377 textdomain (PACKAGE);
379 atexit (close_stdout);
381 have_read_stdin = false;
382 exit_status = EXIT_SUCCESS;
383 convert_entire_line = true;
384 tab_list = NULL;
385 first_free_tab = 0;
387 while ((c = getopt_long (argc, argv, shortopts, longopts, NULL)) != -1)
389 switch (c)
391 case 'i':
392 convert_entire_line = false;
393 break;
395 case 't':
396 parse_tab_stops (optarg);
397 break;
399 case '0': case '1': case '2': case '3': case '4':
400 case '5': case '6': case '7': case '8': case '9':
401 if (optarg)
402 parse_tab_stops (optarg - 1);
403 else
405 char tab_stop[2];
406 tab_stop[0] = c;
407 tab_stop[1] = '\0';
408 parse_tab_stops (tab_stop);
410 break;
412 case_GETOPT_HELP_CHAR;
414 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
416 default:
417 usage (EXIT_FAILURE);
421 validate_tab_stops (tab_list, first_free_tab);
423 if (first_free_tab == 0)
424 tab_size = 8;
425 else if (first_free_tab == 1)
426 tab_size = tab_list[0];
427 else
428 tab_size = 0;
430 file_list = (optind < argc ? &argv[optind] : stdin_argv);
432 expand ();
434 if (have_read_stdin && fclose (stdin) != 0)
435 error (EXIT_FAILURE, errno, "-");
437 exit (exit_status);