*** empty log message ***
[coreutils.git] / src / expand.c
blobecb4590b25578d6c8e063b4568755c1c6badd769
1 /* expand - convert tabs to spaces
2 Copyright (C) 89, 91, 1995-1998, 1999 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software Foundation,
16 Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* By default, convert all tabs to spaces.
19 Preserves backspace characters in the output; they decrement the
20 column count for tab calculations.
21 The default action is equivalent to -8.
23 Options:
24 --tabs=tab1[,tab2[,...]]
25 -t tab1[,tab2[,...]]
26 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
27 spaces apart instead of the default 8. Otherwise,
28 set the tabs at columns tab1, tab2, etc. (numbered from
29 0); replace any tabs beyond the tabstops given with
30 single spaces.
31 --initial
32 -i Only convert initial tabs on each line to spaces.
34 David MacKenzie <djm@gnu.ai.mit.edu> */
36 #include <config.h>
38 #include <stdio.h>
39 #include <getopt.h>
#include <limits.h>
40 #include <sys/types.h>
41 #include "system.h"
42 #include "error.h"
/* File-scope configuration and state shared by the functions below. */

/* NOTE(review): OUTPUT_BLOCK is not referenced anywhere in the visible
   part of this file. */
44 /* The number of bytes added at a time to the amount of memory
45 allocated for the output line. */
46 #define OUTPUT_BLOCK 256
/* NOTE(review): add_tabstop tests `first_free_tab % TABLIST_BLOCK' and
   multiplies this value by sizeof (tab_list[0]), i.e. it treats it as a
   count of tab stop entries rather than a count of bytes. */
48 /* The number of bytes added at a time to the amount of memory
49 allocated for the list of tabstops. */
50 #define TABLIST_BLOCK 256
/* Set from argv[0] at the start of main; printed by usage. */
52 /* The name this program was run with. */
53 char *program_name;
/* main sets this to 1 by default and to 0 when -i/--initial is given. */
55 /* If nonzero, convert blanks even after nonblank characters have been
56 read on the line. */
57 static int convert_entire_line;
/* main sets this to 8 when no tab stop was given, to the single stop
   when exactly one was given, and to 0 when two or more were given. */
59 /* If nonzero, the size of all tab stops. If zero, use `tab_list' instead. */
60 static int tab_size;
/* Grown by add_tabstop through xrealloc; starts out NULL in main. */
62 /* Array of the explicit column numbers of the tab stops;
63 after `tab_list' is exhausted, each additional tab is replaced
64 by a space. The first column is column 0. */
65 static int *tab_list;
/* Doubles as the number of entries currently stored in `tab_list'. */
67 /* The index of the first invalid element of `tab_list',
68 where the next element can be added. */
69 static int first_free_tab;
/* next_file advances this pointer as it consumes names. */
71 /* Null-terminated array of input filenames. */
72 static char **file_list;
/* NOTE(review): the brace lines of this initializer are missing from
   this copy of the file. */
74 /* Default for `file_list' if no files are given on the command line. */
75 static char *stdin_argv[] =
77 "-", NULL
/* Set by next_file when a file name of "-" is opened; main uses it to
   decide whether to close stdin before exiting. */
80 /* Nonzero if we have ever read standard input. */
81 static int have_read_stdin;
/* next_file sets this to 1 after a read, close or open failure. */
83 /* Status to return to the system. */
84 static int exit_status;
/* Stored into by getopt_long through the "help" entry of `longopts'. */
86 /* If nonzero, display usage information and exit. */
87 static int show_help;
/* Stored into by getopt_long through the "version" entry of `longopts'. */
89 /* If nonzero, print the version on standard output then exit. */
90 static int show_version;
/* Long option table passed to getopt_long in main.  --tabs and --initial
   map to the short options 't' and 'i'; --help and --version store 1
   into their flag variables instead.
   NOTE(review): the brace lines of this initializer are missing from
   this copy of the file. */
92 static struct option const longopts[] =
94 {"tabs", required_argument, NULL, 't'},
95 {"initial", no_argument, NULL, 'i'},
96 {"help", no_argument, &show_help, 1},
97 {"version", no_argument, &show_version, 1},
98 {NULL, 0, NULL, 0}
/* Print usage information and terminate the program.
   If STATUS is nonzero, write a one-line hint to stderr that points the
   user at --help.  Otherwise write the full help text and the bug
   reporting address to stdout.
   Ends by calling exit with EXIT_SUCCESS when STATUS is 0 and
   EXIT_FAILURE otherwise; main relies on this when it calls usage (1)
   without a following `break'.
   NOTE(review): in this copy of the file the brace lines and some string
   continuation lines are missing and the column alignment inside the
   help text has been collapsed; restore them from a pristine copy
   before building. */
101 void
102 usage (int status)
/* Error path: short hint only. */
104 if (status != 0)
105 fprintf (stderr, _("Try `%s --help' for more information.\n"),
106 program_name);
107 else
/* Help path: synopsis first, then the option summary. */
109 printf (_("\
110 Usage: %s [OPTION]... [FILE]...\n\
112 program_name);
113 printf (_("\
114 Convert tabs in each FILE to spaces, writing to standard output.\n\
115 With no FILE, or when FILE is -, read standard input.\n\
117 -i, --initial do not convert TABs after non whitespace\n\
118 -t, --tabs=NUMBER have tabs NUMBER characters apart, not 8\n\
119 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
120 --help display this help and exit\n\
121 --version output version information and exit\n\
123 Instead of -t NUMBER or -t LIST, -NUMBER or -LIST may be used.\n\
124 "));
125 puts (_("\nReport bugs to <bug-textutils@gnu.org>."));
/* Map STATUS onto the two portable exit codes. */
127 exit (status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);
130 /* Add tab stop TABVAL to the end of `tab_list', except
131 if TABVAL is -1, do nothing. */
133 static void
134 add_tabstop (int tabval)
136 if (tabval == -1)
137 return;
138 if (first_free_tab % TABLIST_BLOCK == 0)
139 tab_list = (int *) xrealloc ((char *) tab_list,
140 (first_free_tab
141 + TABLIST_BLOCK * sizeof (tab_list[0])));
142 tab_list[first_free_tab++] = tabval;
/* Add the comma or blank separated list of tabstops STOPS
   to the list of tabstops.

   Each run of decimal digits forms one tab stop, which is handed to
   add_tabstop when a separator or the end of the string is reached.
   Empty fields (consecutive separators, or a trailing separator) leave
   the accumulator at -1, which add_tabstop ignores.

   Exits with EXIT_FAILURE through error () if STOPS contains a
   character that is neither a digit nor a separator, or if a number
   does not fit in an int.  */

static void
parse_tabstops (char *stops)
{
  int tabval = -1;              /* Stop being accumulated, or -1.  */

  for (; *stops; stops++)
    {
      if (*stops == ',' || ISBLANK (*stops))
        {
          add_tabstop (tabval);
          tabval = -1;
        }
      else if (ISDIGIT (*stops))
        {
          int digit = *stops - '0';

          if (tabval == -1)
            tabval = 0;

          /* Refuse the digit before the multiplication could overflow:
             signed overflow is undefined behavior.  */
          if (tabval > (INT_MAX - digit) / 10)
            error (EXIT_FAILURE, 0, _("tab stop is too large"));

          tabval = tabval * 10 + digit;
        }
      else
        error (EXIT_FAILURE, 0, _("tab size contains an invalid character"));
    }

  /* Flush the last number, if any.  */
  add_tabstop (tabval);
}
/* Verify the tab stop list TABS, which holds ENTRIES values.
   Every value must be nonzero and strictly greater than the one
   before it; the first offending value makes the program exit with
   EXIT_FAILURE through error ().  An empty list is accepted.  */

static void
validate_tabstops (int *tabs, int entries)
{
  int previous = 0;             /* Last stop accepted so far.  */
  int idx = 0;

  while (idx < entries)
    {
      int stop = tabs[idx++];

      if (stop == 0)
        error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (stop <= previous)
        error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));

      previous = stop;
    }
}
192 /* Close the old stream pointer FP if it is non-NULL,
193 and return a new one opened to read the next input file.
194 Open a filename of `-' as the standard input.
195 Return NULL if there are no more input files. */
197 static FILE *
198 next_file (FILE *fp)
200 static char *prev_file;
201 char *file;
203 if (fp)
205 if (ferror (fp))
207 error (0, errno, "%s", prev_file);
208 exit_status = 1;
210 if (fp == stdin)
211 clearerr (fp); /* Also clear EOF. */
212 else if (fclose (fp) == EOF)
214 error (0, errno, "%s", prev_file);
215 exit_status = 1;
219 while ((file = *file_list++) != NULL)
221 if (file[0] == '-' && file[1] == '\0')
223 have_read_stdin = 1;
224 prev_file = file;
225 return stdin;
227 fp = fopen (file, "r");
228 if (fp)
230 prev_file = file;
231 return fp;
233 error (0, errno, "%s", file);
234 exit_status = 1;
236 return NULL;
239 /* Change tabs to spaces, writing to stdout.
240 Read each file in `file_list', in order. */
242 static void
243 expand (void)
245 FILE *fp; /* Input stream. */
246 int c; /* Each input character. */
247 int tab_index = 0; /* Index in `tab_list' of next tabstop. */
248 int column = 0; /* Column on screen of the next char. */
249 int next_tab_column; /* Column the next tab stop is on. */
250 int convert = 1; /* If nonzero, perform translations. */
252 fp = next_file ((FILE *) NULL);
253 if (fp == NULL)
254 return;
256 /* Binary I/O will preserve the original EOL style (DOS/Unix) of files. */
257 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
259 for (;;)
261 c = getc (fp);
262 if (c == EOF)
264 fp = next_file (fp);
265 if (fp == NULL)
266 break; /* No more files. */
267 else
269 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
270 continue;
274 if (c == '\n')
276 putchar (c);
277 tab_index = 0;
278 column = 0;
279 convert = 1;
281 else if (c == '\t' && convert)
283 if (tab_size == 0)
285 /* Do not let tab_index == first_free_tab;
286 stop when it is 1 less. */
287 while (tab_index < first_free_tab - 1
288 && column >= tab_list[tab_index])
289 tab_index++;
290 next_tab_column = tab_list[tab_index];
291 if (tab_index < first_free_tab - 1)
292 tab_index++;
293 if (column >= next_tab_column)
294 next_tab_column = column + 1; /* Ran out of tab stops. */
296 else
298 next_tab_column = column + tab_size - column % tab_size;
300 while (column < next_tab_column)
302 putchar (' ');
303 ++column;
306 else
308 if (convert)
310 if (c == '\b')
312 if (column > 0)
313 --column;
315 else
317 ++column;
318 if (convert_entire_line == 0)
319 convert = 0;
322 putchar (c);
328 main (int argc, char **argv)
330 int tabval = -1; /* Value of tabstop being read, or -1. */
331 int c; /* Option character. */
333 have_read_stdin = 0;
334 exit_status = 0;
335 convert_entire_line = 1;
336 tab_list = NULL;
337 first_free_tab = 0;
338 program_name = argv[0];
339 setlocale (LC_ALL, "");
340 bindtextdomain (PACKAGE, LOCALEDIR);
341 textdomain (PACKAGE);
343 while ((c = getopt_long (argc, argv, "it:,0123456789", longopts, NULL)) != -1)
345 switch (c)
347 case 0:
348 break;
350 case '?':
351 usage (1);
352 case 'i':
353 convert_entire_line = 0;
354 break;
355 case 't':
356 parse_tabstops (optarg);
357 break;
358 case ',':
359 add_tabstop (tabval);
360 tabval = -1;
361 break;
362 default:
363 if (tabval == -1)
364 tabval = 0;
365 tabval = tabval * 10 + c - '0';
366 break;
370 if (show_version)
372 printf ("expand (%s) %s\n", GNU_PACKAGE, VERSION);
373 exit (EXIT_SUCCESS);
376 if (show_help)
377 usage (0);
379 add_tabstop (tabval);
381 validate_tabstops (tab_list, first_free_tab);
383 if (first_free_tab == 0)
384 tab_size = 8;
385 else if (first_free_tab == 1)
386 tab_size = tab_list[0];
387 else
388 tab_size = 0;
390 if (optind == argc)
391 file_list = stdin_argv;
392 else
393 file_list = &argv[optind];
395 expand ();
397 if (have_read_stdin && fclose (stdin) == EOF)
398 error (EXIT_FAILURE, errno, "-");
399 if (ferror (stdout) || fclose (stdout) == EOF)
400 error (EXIT_FAILURE, errno, _("write error"));
402 exit (exit_status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);