(libfetish_a_SOURCES): Add mmap-stack.h.
[coreutils.git] / src / unexpand.c
blob9c1e751f62e2be63d5bcd79a1c88fc14ac11c734
1 /* unexpand - convert spaces to tabs
2 Copyright (C) 89, 91, 1995-2003 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software Foundation,
16 Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* By default, convert only maximal strings of initial blanks and tabs
19 into tabs.
20 Preserves backspace characters in the output; they decrement the
21 column count for tab calculations.
22 The default action is equivalent to -8.
24 Options:
25 --tabs=tab1[,tab2[,...]]
26 -t tab1[,tab2[,...]]
27 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
28 spaces apart instead of the default 8. Otherwise,
29 set the tabs at columns tab1, tab2, etc. (numbered from
30 0); replace any tabs beyond the tabstops given with
31 single spaces.
32 --all
33 -a Use tabs wherever they would replace 2 or more spaces,
34 not just at the beginnings of lines.
36 David MacKenzie <djm@gnu.ai.mit.edu> */
38 #include <config.h>
40 #include <stdio.h>
41 #include <getopt.h>
42 #include <sys/types.h>
43 #include "system.h"
44 #include "closeout.h"
45 #include "error.h"
46 #include "posixver.h"
48 /* The official name of this program (e.g., no `g' prefix). */
49 #define PROGRAM_NAME "unexpand"
51 #define AUTHORS "David MacKenzie"
53 /* The number of bytes added at a time to the amount of memory
54 allocated for the output line. */
55 #define OUTPUT_BLOCK 256
57 /* The number of bytes added at a time to the amount of memory
58 allocated for the list of tabstops. */
59 #define TABLIST_BLOCK 256
61 /* A sentinel value that's placed at the end of the list of tab stops.
62 This value must be a large number, but not so large that adding the
63 length of a line to it would cause the column variable to overflow. */
64 #define TAB_STOP_SENTINEL INT_MAX
66 /* The name this program was run with. */
67 char *program_name;
69 /* If nonzero, convert blanks even after nonblank characters have been
70 read on the line. */
71 static int convert_entire_line;
73 /* If nonzero, the size of all tab stops. If zero, use `tab_list' instead. */
74 static int tab_size;
76 /* Array of the explicit column numbers of the tab stops;
77 after `tab_list' is exhausted, the rest of the line is printed
78 unchanged. The first column is column 0. */
79 static int *tab_list;
81 /* The index of the first invalid element of `tab_list',
82 where the next element can be added. */
83 static int first_free_tab;
85 /* Null-terminated array of input filenames. */
86 static char **file_list;
88 /* Default for `file_list' if no files are given on the command line. */
89 static char *stdin_argv[] =
91 "-", NULL
94 /* Nonzero if we have ever read standard input. */
95 static int have_read_stdin;
97 /* Status to return to the system. */
98 static int exit_status;
100 /* For long options that have no equivalent short option, use a
101 non-character as a pseudo short option, starting with CHAR_MAX + 1. */
102 enum
104 CONVERT_FIRST_ONLY_OPTION = CHAR_MAX + 1
107 static struct option const longopts[] =
109 {"tabs", required_argument, NULL, 't'},
110 {"all", no_argument, NULL, 'a'},
111 {"first-only", no_argument, NULL, CONVERT_FIRST_ONLY_OPTION},
112 {GETOPT_HELP_OPTION_DECL},
113 {GETOPT_VERSION_OPTION_DECL},
114 {NULL, 0, NULL, 0}
117 /* Add tab stop TABVAL to the end of `tab_list', except
118 if TABVAL is -1, do nothing. */
120 static void
121 add_tabstop (int tabval)
123 if (tabval == -1)
124 return;
125 if (first_free_tab % TABLIST_BLOCK == 0)
126 tab_list = (int *) xrealloc ((char *) tab_list,
127 first_free_tab + TABLIST_BLOCK);
128 tab_list[first_free_tab++] = tabval;
/* Add the comma or blank separated list of tabstops STOPS
   to the list of tabstops.

   Each run of decimal digits forms one tab stop; empty fields (two
   separators in a row, or a leading/trailing separator) contribute
   nothing because add_tabstop ignores -1.  Any character that is not a
   digit, a comma or a blank is a fatal error, as is a value that does
   not fit in an int. */

static void
parse_tabstops (const char *stops)
{
  int tabval = -1;		/* Stop being accumulated, or -1 if none. */

  for (; *stops; stops++)
    {
      if (*stops == ',' || ISBLANK (*stops))
	{
	  add_tabstop (tabval);
	  tabval = -1;
	}
      else if (ISDIGIT (*stops))
	{
	  int digit = *stops - '0';

	  if (tabval == -1)
	    tabval = 0;

	  /* Refuse the digit rather than let `tabval * 10 + digit'
	     overflow, which would be undefined behavior. */
	  if (tabval > (INT_MAX - digit) / 10)
	    error (EXIT_FAILURE, 0, _("tab stop value is too large"));

	  tabval = tabval * 10 + digit;
	}
      else
	error (EXIT_FAILURE, 0, _("tab size contains an invalid character"));
    }

  /* Store the stop that was still being read when the string ended. */
  add_tabstop (tabval);
}

/* Verify the ENTRIES tab stops stored in TABS: none may be zero and
   each must be strictly greater than the one before it.  A violation
   is reported with a fatal error. */

static void
validate_tabstops (const int *tabs, int entries)
{
  int last_seen = 0;
  int idx = 0;

  while (idx < entries)
    {
      int current = tabs[idx];

      if (current == 0)
	error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (!(last_seen < current))
	error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));

      last_seen = current;
      idx++;
    }
}

178 /* Close the old stream pointer FP if it is non-NULL,
179 and return a new one opened to read the next input file.
180 Open a filename of `-' as the standard input.
181 Return NULL if there are no more input files. */
183 static FILE *
184 next_file (FILE *fp)
186 static char *prev_file;
187 char *file;
189 if (fp)
191 if (ferror (fp))
193 error (0, errno, "%s", prev_file);
194 exit_status = 1;
196 if (fp == stdin)
197 clearerr (fp); /* Also clear EOF. */
198 else if (fclose (fp) == EOF)
200 error (0, errno, "%s", prev_file);
201 exit_status = 1;
205 while ((file = *file_list++) != NULL)
207 if (file[0] == '-' && file[1] == '\0')
209 have_read_stdin = 1;
210 prev_file = file;
211 return stdin;
213 fp = fopen (file, "r");
214 if (fp)
216 prev_file = file;
217 return fp;
219 error (0, errno, "%s", file);
220 exit_status = 1;
222 return NULL;
225 /* Change spaces to tabs, writing to stdout.
226 Read each file in `file_list', in order. */
228 static void
229 unexpand (void)
231 FILE *fp; /* Input stream. */
232 int c; /* Each input character. */
233 /* Index in `tab_list' of next tabstop: */
234 int tab_index = 0; /* For calculating width of pending tabs. */
235 int print_tab_index = 0; /* For printing as many tabs as possible. */
236 unsigned int column = 0; /* Column on screen of next char. */
237 int next_tab_column; /* Column the next tab stop is on. */
238 int convert = 1; /* If nonzero, perform translations. */
239 unsigned int pending = 0; /* Pending columns of blanks. */
241 fp = next_file ((FILE *) NULL);
242 if (fp == NULL)
243 return;
245 /* Binary I/O will preserve the original EOL style (DOS/Unix) of files. */
246 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
248 for (;;)
250 c = getc (fp);
252 if (c == ' ' && convert && column < TAB_STOP_SENTINEL)
254 ++pending;
255 ++column;
257 else if (c == '\t' && convert)
259 if (tab_size == 0)
261 /* Do not let tab_index == first_free_tab;
262 stop when it is 1 less. */
263 while (tab_index < first_free_tab - 1
264 && column >= tab_list[tab_index])
265 tab_index++;
266 next_tab_column = tab_list[tab_index];
267 if (tab_index < first_free_tab - 1)
268 tab_index++;
269 if (column >= next_tab_column)
271 convert = 0; /* Ran out of tab stops. */
272 goto flush_pend;
275 else
277 next_tab_column = column + tab_size - column % tab_size;
279 pending += next_tab_column - column;
280 column = next_tab_column;
282 else
284 flush_pend:
285 /* Flush pending spaces. Print as many tabs as possible,
286 then print the rest as spaces. */
287 if (pending == 1)
289 putchar (' ');
290 pending = 0;
292 column -= pending;
293 while (pending > 0)
295 if (tab_size == 0)
297 /* Do not let print_tab_index == first_free_tab;
298 stop when it is 1 less. */
299 while (print_tab_index < first_free_tab - 1
300 && column >= tab_list[print_tab_index])
301 print_tab_index++;
302 next_tab_column = tab_list[print_tab_index];
303 if (print_tab_index < first_free_tab - 1)
304 print_tab_index++;
306 else
308 next_tab_column = column + tab_size - column % tab_size;
310 if (next_tab_column - column <= pending)
312 putchar ('\t');
313 pending -= next_tab_column - column;
314 column = next_tab_column;
316 else
318 --print_tab_index;
319 column += pending;
320 while (pending != 0)
322 putchar (' ');
323 pending--;
328 if (c == EOF)
330 fp = next_file (fp);
331 if (fp == NULL)
332 break; /* No more files. */
333 else
335 SET_BINARY2 (fileno (fp), STDOUT_FILENO);
336 continue;
340 if (convert)
342 if (c == '\b')
344 if (column > 0)
345 --column;
347 else
349 ++column;
350 if (convert_entire_line == 0)
351 convert = 0;
355 putchar (c);
357 if (c == '\n')
359 tab_index = print_tab_index = 0;
360 column = pending = 0;
361 convert = 1;
/* Print usage information and terminate the program.
   If STATUS is nonzero, write a one-line hint that points at `--help'
   to stderr.  Otherwise write the full help text (synopsis, description,
   option list, standard --help/--version descriptions and the bug
   report address) to stdout.
   Finally call exit with EXIT_SUCCESS when STATUS is 0 and with
   EXIT_FAILURE otherwise. */
367 void
368 usage (int status)
370 if (status != 0)
371 fprintf (stderr, _("Try `%s --help' for more information.\n"),
372 program_name);
373 else
375 printf (_("\
376 Usage: %s [OPTION]... [FILE]...\n\
378 program_name);
379 fputs (_("\
380 Convert spaces in each FILE to tabs, writing to standard output.\n\
381 With no FILE, or when FILE is -, read standard input.\n\
383 "), stdout);
384 fputs (_("\
385 Mandatory arguments to long options are mandatory for short options too.\n\
386 "), stdout);
387 fputs (_("\
388 -a, --all convert all whitespace, instead of just initial whitespace\n\
389 --first-only convert only leading sequences of whitespace (overrides -a)\n\
390 -t, --tabs=N have tabs N characters apart instead of 8 (enables -a)\n\
391 -t, --tabs=LIST use comma separated LIST of tab positions (enables -a)\n\
392 "), stdout);
393 fputs (HELP_OPTION_DESCRIPTION, stdout);
394 fputs (VERSION_OPTION_DESCRIPTION, stdout);
395 printf (_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
397 exit (status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);
401 main (int argc, char **argv)
403 int tabval = -1; /* Value of tabstop being read, or -1. */
404 int c; /* Option character. */
406 /* If nonzero, cancel the effect of any -a (explicit or implicit in -t),
407 so that only leading white space will be considered. */
408 int convert_first_only = 0;
410 bool obsolete_tablist = false;
412 program_name = argv[0];
413 setlocale (LC_ALL, "");
414 bindtextdomain (PACKAGE, LOCALEDIR);
415 textdomain (PACKAGE);
417 atexit (close_stdout);
419 have_read_stdin = 0;
420 exit_status = 0;
421 convert_entire_line = 0;
422 tab_list = NULL;
423 first_free_tab = 0;
425 while ((c = getopt_long (argc, argv, ",0123456789at:", longopts, NULL))
426 != -1)
428 switch (c)
430 case 0:
431 break;
433 case '?':
434 usage (EXIT_FAILURE);
435 case 'a':
436 convert_entire_line = 1;
437 break;
438 case 't':
439 convert_entire_line = 1;
440 parse_tabstops (optarg);
441 break;
442 case CONVERT_FIRST_ONLY_OPTION:
443 convert_first_only = 1;
444 break;
445 case ',':
446 add_tabstop (tabval);
447 tabval = -1;
448 obsolete_tablist = true;
449 break;
450 case_GETOPT_HELP_CHAR;
451 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
452 default:
453 if (tabval == -1)
454 tabval = 0;
455 tabval = tabval * 10 + c - '0';
456 obsolete_tablist = true;
457 break;
461 if (obsolete_tablist && 200112 <= posix2_version ())
463 error (0, 0,
464 _("`-LIST' option is obsolete; use `--first-only -t LIST'"));
465 usage (EXIT_FAILURE);
468 if (convert_first_only)
469 convert_entire_line = 0;
471 add_tabstop (tabval);
473 validate_tabstops (tab_list, first_free_tab);
475 if (first_free_tab == 0)
476 tab_size = 8;
477 else if (first_free_tab == 1)
478 tab_size = tab_list[0];
479 else
481 /* Append a sentinel to the list of tab stop indices. */
482 add_tabstop (TAB_STOP_SENTINEL);
483 tab_size = 0;
486 if (optind == argc)
487 file_list = stdin_argv;
488 else
489 file_list = &argv[optind];
491 unexpand ();
493 if (have_read_stdin && fclose (stdin) == EOF)
494 error (EXIT_FAILURE, errno, "-");
495 exit (exit_status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);