.
[coreutils.git] / src / expand.c
blob5180dfd1087a20c9b93cc9980501bd767b3f1df6
1 /* expand - convert tabs to spaces
2 Copyright (C) 89, 91, 95, 1996 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* By default, convert all tabs to spaces.
19 Preserves backspace characters in the output; they decrement the
20 column count for tab calculations.
21 The default action is equivalent to -8.
23 Options:
24 --tabs=tab1[,tab2[,...]]
25 -t tab1[,tab2[,...]]
26 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
27 spaces apart instead of the default 8. Otherwise,
28 set the tabs at columns tab1, tab2, etc. (numbered from
29 0); replace any tabs beyond the tabstops given with
30 single spaces.
31 --initial
32 -i Only convert initial tabs on each line to spaces.
34 David MacKenzie <djm@gnu.ai.mit.edu> */
#include <config.h>

/* Get isblank from GNU libc.  */
#define _GNU_SOURCE

#include <stdio.h>
#include <getopt.h>
#include <limits.h>
#include <sys/types.h>
#include "system.h"
#include "error.h"
47 /* The number of bytes added at a time to the amount of memory
48 allocated for the output line. */
49 #define OUTPUT_BLOCK 256
/* The number of tab stop entries added at a time to the space
   allocated for the list of tabstops.  */
53 #define TABLIST_BLOCK 256
/* Allocation helpers; only declared here, their definitions are not
   part of this file.  */
char *xmalloc ();
char *xrealloc ();

/* Name under which the program was invoked (argv[0]).  */
char *program_name;

/* Nonzero: keep converting tabs for the whole line.
   Zero (-i): stop converting partway through the line.  */
static int convert_entire_line;

/* Distance between evenly spaced tab stops, or zero when the explicit
   positions in `tab_list' are to be used instead.  */
static int tab_size;

/* Explicit tab stop columns, counted from column 0.  A tab found past
   the last listed stop is replaced by a single space.  */
static int *tab_list;

/* Number of stops currently stored in `tab_list', i.e. the index at
   which the next stop will be stored.  */
static int first_free_tab;

/* NULL-terminated vector of the input file names still to be read.  */
static char **file_list;

/* Value used for `file_list' when the command line names no files:
   read standard input only.  */
static char *stdin_argv[] =
{
  "-", NULL
};

/* Nonzero once standard input has been selected as an input file.  */
static int have_read_stdin;

/* Exit status accumulated while processing; nonzero after any error.  */
static int exit_status;

/* Set by --help: print the usage message and exit.  */
static int show_help;

/* Set by --version: print the version string and exit.  */
static int show_version;
98 static struct option const longopts[] =
100 {"tabs", required_argument, NULL, 't'},
101 {"initial", no_argument, NULL, 'i'},
102 {"help", no_argument, &show_help, 1},
103 {"version", no_argument, &show_version, 1},
104 {NULL, 0, NULL, 0}
107 static void
108 usage (int status)
110 if (status != 0)
111 fprintf (stderr, _("Try `%s --help' for more information.\n"),
112 program_name);
113 else
115 printf (_("\
116 Usage: %s [OPTION]... [FILE]...\n\
118 program_name);
119 printf (_("\
120 Convert tabs in each FILE to spaces, writing to standard output.\n\
121 With no FILE, or when FILE is -, read standard input.\n\
123 -i, --initial do not convert TABs after non whitespace\n\
124 -t, --tabs=NUMBER have tabs NUMBER characters apart, not 8\n\
125 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
126 --help display this help and exit\n\
127 --version output version information and exit\n\
129 Instead of -t NUMBER or -t LIST, -NUMBER or -LIST may be used.\n\
130 "));
132 exit (status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);
135 /* Add tab stop TABVAL to the end of `tab_list', except
136 if TABVAL is -1, do nothing. */
138 static void
139 add_tabstop (int tabval)
141 if (tabval == -1)
142 return;
143 if (first_free_tab % TABLIST_BLOCK == 0)
144 tab_list = (int *) xrealloc (tab_list, first_free_tab
145 + TABLIST_BLOCK * sizeof (tab_list[0]));
146 tab_list[first_free_tab++] = tabval;
/* Add the comma or blank separated list of tabstops STOPS
   to the list of tabstops.

   Each run of decimal digits forms one tab stop.  An empty field
   (two adjacent separators, or a leading/trailing separator) adds
   nothing, because add_tabstop ignores the value -1.  Any character
   that is not a digit, comma or blank is a fatal error, as is a
   value too large to be represented in an int.  */

static void
parse_tabstops (char *stops)
{
  int tabval = -1;      /* Value being accumulated, or -1 if none.  */

  for (; *stops; stops++)
    {
      if (*stops == ',' || ISBLANK (*stops))
        {
          add_tabstop (tabval);
          tabval = -1;
        }
      else if (ISDIGIT (*stops))
        {
          int digit = *stops - '0';

          if (tabval == -1)
            tabval = 0;
          /* Refuse the digit if appending it would overflow; signed
             overflow is undefined behavior and would otherwise yield
             a garbage tab stop.  */
          if (tabval > (INT_MAX - digit) / 10)
            error (EXIT_FAILURE, 0, _("tab stop value is too large"));
          tabval = tabval * 10 + digit;
        }
      else
        error (EXIT_FAILURE, 0, _("tab size contains an invalid character"));
    }

  /* Flush the last field, which has no trailing separator.  */
  add_tabstop (tabval);
}
/* Verify the ENTRIES tab stops stored in TABS.
   Every stop must be nonzero and strictly greater than the stop
   before it; the first violation found is reported as a fatal
   error.  An empty list is accepted.  */

static void
validate_tabstops (int *tabs, int entries)
{
  int last_stop = 0;
  int idx = 0;

  while (idx < entries)
    {
      int stop = tabs[idx++];

      /* Zero is tested separately so it gets its own message rather
         than the "ascending" one.  */
      if (stop == 0)
        error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (stop <= last_stop)
        error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));
      last_stop = stop;
    }
}
196 /* Close the old stream pointer FP if it is non-NULL,
197 and return a new one opened to read the next input file.
198 Open a filename of `-' as the standard input.
199 Return NULL if there are no more input files. */
201 static FILE *
202 next_file (FILE *fp)
204 static char *prev_file;
205 char *file;
207 if (fp)
209 if (ferror (fp))
211 error (0, errno, "%s", prev_file);
212 exit_status = 1;
214 if (fp == stdin)
215 clearerr (fp); /* Also clear EOF. */
216 else if (fclose (fp) == EOF)
218 error (0, errno, "%s", prev_file);
219 exit_status = 1;
223 while ((file = *file_list++) != NULL)
225 if (file[0] == '-' && file[1] == '\0')
227 have_read_stdin = 1;
228 prev_file = file;
229 return stdin;
231 fp = fopen (file, "r");
232 if (fp)
234 prev_file = file;
235 return fp;
237 error (0, errno, "%s", file);
238 exit_status = 1;
240 return NULL;
243 /* Change tabs to spaces, writing to stdout.
244 Read each file in `file_list', in order. */
246 static void
247 expand (void)
249 FILE *fp; /* Input stream. */
250 int c; /* Each input character. */
251 int tab_index = 0; /* Index in `tab_list' of next tabstop. */
252 int column = 0; /* Column on screen of the next char. */
253 int next_tab_column; /* Column the next tab stop is on. */
254 int convert = 1; /* If nonzero, perform translations. */
256 fp = next_file ((FILE *) NULL);
257 if (fp == NULL)
258 return;
259 for (;;)
261 c = getc (fp);
262 if (c == EOF)
264 fp = next_file (fp);
265 if (fp == NULL)
266 break; /* No more files. */
267 else
268 continue;
271 if (c == '\n')
273 putchar (c);
274 tab_index = 0;
275 column = 0;
276 convert = 1;
278 else if (c == '\t' && convert)
280 if (tab_size == 0)
282 /* Do not let tab_index == first_free_tab;
283 stop when it is 1 less. */
284 while (tab_index < first_free_tab - 1
285 && column >= tab_list[tab_index])
286 tab_index++;
287 next_tab_column = tab_list[tab_index];
288 if (tab_index < first_free_tab - 1)
289 tab_index++;
290 if (column >= next_tab_column)
291 next_tab_column = column + 1; /* Ran out of tab stops. */
293 else
295 next_tab_column = column + tab_size - column % tab_size;
297 while (column < next_tab_column)
299 putchar (' ');
300 ++column;
303 else
305 if (convert)
307 if (c == '\b')
309 if (column > 0)
310 --column;
312 else
314 ++column;
315 if (convert_entire_line == 0)
316 convert = 0;
319 putchar (c);
325 main (int argc, char **argv)
327 int tabval = -1; /* Value of tabstop being read, or -1. */
328 int c; /* Option character. */
330 have_read_stdin = 0;
331 exit_status = 0;
332 convert_entire_line = 1;
333 tab_list = NULL;
334 first_free_tab = 0;
335 program_name = argv[0];
336 setlocale (LC_ALL, "");
337 bindtextdomain (PACKAGE, LOCALEDIR);
338 textdomain (PACKAGE);
340 while ((c = getopt_long (argc, argv, "it:,0123456789", longopts, (int *) 0))
341 != EOF)
343 switch (c)
345 case 0:
346 break;
348 case '?':
349 usage (1);
350 case 'i':
351 convert_entire_line = 0;
352 break;
353 case 't':
354 parse_tabstops (optarg);
355 break;
356 case ',':
357 add_tabstop (tabval);
358 tabval = -1;
359 break;
360 default:
361 if (tabval == -1)
362 tabval = 0;
363 tabval = tabval * 10 + c - '0';
364 break;
368 if (show_version)
370 printf ("expand - %s\n", PACKAGE_VERSION);
371 exit (EXIT_SUCCESS);
374 if (show_help)
375 usage (0);
377 add_tabstop (tabval);
379 validate_tabstops (tab_list, first_free_tab);
381 if (first_free_tab == 0)
382 tab_size = 8;
383 else if (first_free_tab == 1)
384 tab_size = tab_list[0];
385 else
386 tab_size = 0;
388 if (optind == argc)
389 file_list = stdin_argv;
390 else
391 file_list = &argv[optind];
393 expand ();
395 if (have_read_stdin && fclose (stdin) == EOF)
396 error (EXIT_FAILURE, errno, "-");
397 if (ferror (stdout) || fclose (stdout) == EOF)
398 error (EXIT_FAILURE, errno, _("write error"));
400 exit (exit_status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);