Clone the Makefile.am from join-test.
[coreutils.git] / src / unexpand.c
blob0d04ced64f106d5781a0bdfe39942ac5b68f6578
1 /* unexpand - convert spaces to tabs
2 Copyright (C) 89, 91, 95, 1996 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* By default, convert only maximal strings of initial blanks and tabs
19 into tabs.
20 Preserves backspace characters in the output; they decrement the
21 column count for tab calculations.
22 The default action is equivalent to -8.
24 Options:
25 --tabs=tab1[,tab2[,...]]
26 -t tab1[,tab2[,...]]
27 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
28 spaces apart instead of the default 8. Otherwise,
29 set the tabs at columns tab1, tab2, etc. (numbered from
30 0); replace any tabs beyond the tabstops given with
31 single spaces.
32 --all
33 -a Use tabs wherever they would replace 2 or more spaces,
34 not just at the beginnings of lines.
36 David MacKenzie <djm@gnu.ai.mit.edu> */
38 #include <config.h>
40 /* Get isblank from GNU libc. */
41 #define _GNU_SOURCE
43 #include <stdio.h>
44 #include <getopt.h>
45 #include <sys/types.h>
46 #include "system.h"
48 #ifdef HAVE_LIMITS_H
49 # include <limits.h>
50 #endif
52 #ifndef UINT_MAX
53 # define UINT_MAX ((unsigned int) ~(unsigned int) 0)
54 #endif
56 #ifndef INT_MAX
57 # define INT_MAX ((int) (UINT_MAX >> 1))
58 #endif
60 #include "error.h"
62 /* The number of bytes added at a time to the amount of memory
63 allocated for the output line. */
64 #define OUTPUT_BLOCK 256
66 /* The number of bytes added at a time to the amount of memory
67 allocated for the list of tabstops. */
68 #define TABLIST_BLOCK 256
/* Allocation routines used by this file.  They are declared here
   without prototypes and are not defined in this file.  */
char *xmalloc ();
char *xrealloc ();

/* Name under which the program was invoked; main stores argv[0] here
   and usage prints it.  */
char *program_name;

/* Option flags.  */

/* Nonzero means blanks are converted even when they follow a nonblank
   character on the line.  */
static int convert_entire_line;

/* Set to 1 by the --help long option: print usage and exit.  */
static int show_help;

/* Set to 1 by the --version long option: print the version and exit.  */
static int show_version;

/* Tab stop state.  */

/* Distance between tab stops when they are evenly spaced.  Zero means
   the explicit columns stored in `tab_list' are used instead.  */
static int tab_size;

/* Explicit tab stop columns, with the first column numbered 0.  Once
   the list is exhausted the rest of the line is printed unchanged.  */
static int *tab_list;

/* Number of entries stored in `tab_list', which is also the index at
   which the next entry will be stored.  */
static int first_free_tab;

/* Input state.  */

/* NULL-terminated vector of the input file names still to be read.  */
static char **file_list;

/* Value given to `file_list' when the command line names no files.  */
static char *stdin_argv[] =
{
  "-", NULL
};

/* Nonzero once standard input has been handed out as an input stream.  */
static int have_read_stdin;

/* Exit status the program will report; set to 1 when an input file
   cannot be opened, read or closed.  */
static int exit_status;
113 static struct option const longopts[] =
115 {"tabs", required_argument, NULL, 't'},
116 {"all", no_argument, NULL, 'a'},
117 {"help", no_argument, &show_help, 1},
118 {"version", no_argument, &show_version, 1},
119 {NULL, 0, NULL, 0}
122 /* Add tab stop TABVAL to the end of `tab_list', except
123 if TABVAL is -1, do nothing. */
125 static void
126 add_tabstop (int tabval)
128 if (tabval == -1)
129 return;
130 if (first_free_tab % TABLIST_BLOCK == 0)
131 tab_list = (int *) xrealloc (tab_list, first_free_tab + TABLIST_BLOCK);
132 tab_list[first_free_tab++] = tabval;
/* Add the comma or blank separated list of tab stops STOPS to the list
   of tab stops.  Each run of digits forms one decimal value; empty
   fields (for example two adjacent commas) add nothing.  Exit with a
   diagnostic if STOPS contains any other character or if a value does
   not fit in an int.  */

static void
parse_tabstops (const char *stops)
{
  /* Value of the tab stop being read, or -1 when no digit of the
     current field has been seen yet.  */
  int tabval = -1;

  for (; *stops; stops++)
    {
      if (*stops == ',' || ISBLANK (*stops))
        {
          add_tabstop (tabval);
          tabval = -1;
        }
      else if (ISDIGIT (*stops))
        {
          int digit = *stops - '0';

          if (tabval == -1)
            tabval = 0;
          /* Refuse to compute tabval * 10 + digit when the result
             would exceed INT_MAX; signed overflow is undefined.  */
          if (tabval > (INT_MAX - digit) / 10)
            error (EXIT_FAILURE, 0, _("tab size is too large"));
          tabval = tabval * 10 + digit;
        }
      else
        error (EXIT_FAILURE, 0, _("tab size contains an invalid character"));
    }

  /* Store the last field, which has no trailing separator.  */
  add_tabstop (tabval);
}
/* Verify the ENTRIES tab stops stored in TABS: every value must be
   nonzero and strictly greater than the one before it.  Exit with a
   diagnostic on the first value that breaks either rule.  */

static void
validate_tabstops (const int *tabs, int entries)
{
  int last_stop = 0;
  int idx = 0;

  while (idx < entries)
    {
      int stop = tabs[idx++];

      if (stop == 0)
        error (EXIT_FAILURE, 0, _("tab size cannot be 0"));
      if (stop <= last_stop)
        error (EXIT_FAILURE, 0, _("tab sizes must be ascending"));
      last_stop = stop;
    }
}
182 /* Close the old stream pointer FP if it is non-NULL,
183 and return a new one opened to read the next input file.
184 Open a filename of `-' as the standard input.
185 Return NULL if there are no more input files. */
187 static FILE *
188 next_file (FILE *fp)
190 static char *prev_file;
191 char *file;
193 if (fp)
195 if (ferror (fp))
197 error (0, errno, "%s", prev_file);
198 exit_status = 1;
200 if (fp == stdin)
201 clearerr (fp); /* Also clear EOF. */
202 else if (fclose (fp) == EOF)
204 error (0, errno, "%s", prev_file);
205 exit_status = 1;
209 while ((file = *file_list++) != NULL)
211 if (file[0] == '-' && file[1] == '\0')
213 have_read_stdin = 1;
214 prev_file = file;
215 return stdin;
217 fp = fopen (file, "r");
218 if (fp)
220 prev_file = file;
221 return fp;
223 error (0, errno, "%s", file);
224 exit_status = 1;
226 return NULL;
229 /* Change spaces to tabs, writing to stdout.
230 Read each file in `file_list', in order. */
232 static void
233 unexpand (void)
235 FILE *fp; /* Input stream. */
236 int c; /* Each input character. */
237 /* Index in `tab_list' of next tabstop: */
238 int tab_index = 0; /* For calculating width of pending tabs. */
239 int print_tab_index = 0; /* For printing as many tabs as possible. */
240 int column = 0; /* Column on screen of next char. */
241 int next_tab_column; /* Column the next tab stop is on. */
242 int convert = 1; /* If nonzero, perform translations. */
243 int pending = 0; /* Pending columns of blanks. */
245 fp = next_file ((FILE *) NULL);
246 if (fp == NULL)
247 return;
249 for (;;)
251 c = getc (fp);
253 if (c == ' ' && convert)
255 ++pending;
256 ++column;
258 else if (c == '\t' && convert)
260 if (tab_size == 0)
262 /* Do not let tab_index == first_free_tab;
263 stop when it is 1 less. */
264 while (tab_index < first_free_tab - 1
265 && column >= tab_list[tab_index])
266 tab_index++;
267 next_tab_column = tab_list[tab_index];
268 if (tab_index < first_free_tab - 1)
269 tab_index++;
270 if (column >= next_tab_column)
272 convert = 0; /* Ran out of tab stops. */
273 goto flush_pend;
276 else
278 next_tab_column = column + tab_size - column % tab_size;
280 pending += next_tab_column - column;
281 column = next_tab_column;
283 else
285 flush_pend:
286 /* Flush pending spaces. Print as many tabs as possible,
287 then print the rest as spaces. */
288 if (pending == 1)
290 putchar (' ');
291 pending = 0;
293 column -= pending;
294 while (pending != 0)
296 if (tab_size == 0)
298 /* Do not let print_tab_index == first_free_tab;
299 stop when it is 1 less. */
300 while (print_tab_index < first_free_tab - 1
301 && column >= tab_list[print_tab_index])
302 print_tab_index++;
303 next_tab_column = tab_list[print_tab_index];
304 if (print_tab_index < first_free_tab - 1)
305 print_tab_index++;
307 else
309 next_tab_column = column + tab_size - column % tab_size;
311 if (next_tab_column - column <= pending)
313 putchar ('\t');
314 pending -= next_tab_column - column;
315 column = next_tab_column;
317 else
319 --print_tab_index;
320 column += pending;
321 while (pending != 0)
323 putchar (' ');
324 pending--;
329 if (c == EOF)
331 fp = next_file (fp);
332 if (fp == NULL)
333 break; /* No more files. */
334 else
335 continue;
338 if (convert)
340 if (c == '\b')
342 if (column > 0)
343 --column;
345 else
347 ++column;
348 if (convert_entire_line == 0)
349 convert = 0;
353 putchar (c);
355 if (c == '\n')
357 tab_index = print_tab_index = 0;
358 column = pending = 0;
359 convert = 1;
365 static void
366 usage (int status)
368 if (status != 0)
369 fprintf (stderr, _("Try `%s --help' for more information.\n"),
370 program_name);
371 else
373 printf (_("\
374 Usage: %s [OPTION]... [FILE]...\n\
376 program_name);
377 printf (_("\
378 Convert spaces in each FILE to tabs, writing to standard output.\n\
379 With no FILE, or when FILE is -, read standard input.\n\
381 -a, --all convert all whitespace, instead of initial whitespace\n\
382 -t, --tabs=NUMBER have tabs NUMBER characters apart instead of 8\n\
383 -t, --tabs=LIST use comma separated list of explicit tab positions\n\
384 --help display this help and exit\n\
385 --version output version information and exit\n\
387 Instead of -t NUMBER or -t LIST, -NUMBER or -LIST may be used.\n\
388 "));
389 puts (_("\nReport bugs to textutils-bugs@gnu.ai.mit.edu"));
391 exit (status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);
395 main (int argc, char **argv)
397 int tabval = -1; /* Value of tabstop being read, or -1. */
398 int c; /* Option character. */
400 program_name = argv[0];
401 setlocale (LC_ALL, "");
402 bindtextdomain (PACKAGE, LOCALEDIR);
403 textdomain (PACKAGE);
405 have_read_stdin = 0;
406 exit_status = 0;
407 convert_entire_line = 0;
408 tab_list = NULL;
409 first_free_tab = 0;
411 while ((c = getopt_long (argc, argv, "at:,0123456789", longopts, (int *) 0))
412 != EOF)
414 switch (c)
416 case 0:
417 break;
419 case '?':
420 usage (1);
421 case 'a':
422 convert_entire_line = 1;
423 break;
424 case 't':
425 convert_entire_line = 1;
426 parse_tabstops (optarg);
427 break;
428 case ',':
429 add_tabstop (tabval);
430 tabval = -1;
431 break;
432 default:
433 if (tabval == -1)
434 tabval = 0;
435 tabval = tabval * 10 + c - '0';
436 break;
440 if (show_version)
442 printf ("unexpand (%s) %s\n", GNU_PACKAGE, VERSION);
443 exit (EXIT_SUCCESS);
446 if (show_help)
447 usage (0);
449 add_tabstop (tabval);
451 validate_tabstops (tab_list, first_free_tab);
453 if (first_free_tab == 0)
454 tab_size = 8;
455 else if (first_free_tab == 1)
456 tab_size = tab_list[0];
457 else
459 /* Append a sentinel to the list of tab stop indices. */
460 add_tabstop (INT_MAX);
461 tab_size = 0;
464 if (optind == argc)
465 file_list = stdin_argv;
466 else
467 file_list = &argv[optind];
469 unexpand ();
471 if (have_read_stdin && fclose (stdin) == EOF)
472 error (EXIT_FAILURE, errno, "-");
473 if (fclose (stdout) == EOF)
474 error (EXIT_FAILURE, errno, _("write error"));
475 exit (exit_status == 0 ? EXIT_SUCCESS : EXIT_FAILURE);