1 /* unexpand - convert blanks to tabs
2 Copyright (C) 1989-2024 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <https://www.gnu.org/licenses/>. */
17 /* By default, convert only maximal strings of initial blanks and tabs into tabs.
19 Preserves backspace characters in the output; they decrement the
20 column count for tab calculations.
21 The default action is equivalent to -8.
24 --tabs=tab1[,tab2[,...]]
26 -tab1[,tab2[,...]] If only one tab stop is given, set the tabs tab1
27 columns apart instead of the default 8. Otherwise,
28 set the tabs at columns tab1, tab2, etc. (numbered from
29 0); preserve any blanks beyond the tab stops given.
31 -a Use tabs wherever they would replace 2 or more blanks,
32 not just at the beginnings of lines.
34 David MacKenzie <djm@gnu.ai.mit.edu> */
41 #include <sys/types.h>
43 #include "expand-common.h"
45 /* The official name of this program (e.g., no 'g' prefix). */
46 #define PROGRAM_NAME "unexpand"
48 #define AUTHORS proper_name ("David MacKenzie")
52 /* For long options that have no equivalent short option, use a
53 non-character as a pseudo short option, starting with CHAR_MAX + 1. */
56 CONVERT_FIRST_ONLY_OPTION
= CHAR_MAX
+ 1
59 static struct option
const longopts
[] =
61 {"tabs", required_argument
, nullptr, 't'},
62 {"all", no_argument
, nullptr, 'a'},
63 {"first-only", no_argument
, nullptr, CONVERT_FIRST_ONLY_OPTION
},
64 {GETOPT_HELP_OPTION_DECL
},
65 {GETOPT_VERSION_OPTION_DECL
},
66 {nullptr, 0, nullptr, 0}
72 if (status
!= EXIT_SUCCESS
)
77 Usage: %s [OPTION]... [FILE]...\n\
81 Convert blanks in each FILE to tabs, writing to standard output.\n\
85 emit_mandatory_arg_note ();
88 -a, --all convert all blanks, instead of just initial blanks\n\
89 --first-only convert only leading sequences of blanks (overrides -a)\n\
90 -t, --tabs=N have tabs N characters apart instead of 8 (enables -a)\n\
92 emit_tab_list_info ();
93 fputs (HELP_OPTION_DESCRIPTION
, stdout
);
94 fputs (VERSION_OPTION_DESCRIPTION
, stdout
);
95 emit_ancillary_info (PROGRAM_NAME
);
100 /* Change blanks to tabs, writing to stdout.
101 Read each file in 'file_list', in order. */
107 FILE *fp
= next_file (nullptr);
109 /* The array of pending blanks. In non-POSIX locales, blanks can
110 include characters other than spaces, so the blanks must be
111 stored, not merely counted. */
117 /* The worst case is a non-blank character, then one blank, then a
118 tab stop, then MAX_COLUMN_WIDTH - 1 blanks, then a non-blank; so
119 allocate MAX_COLUMN_WIDTH bytes to store the blanks. */
120 pending_blank
= xmalloc (max_column_width
);
124 /* Input character, or EOF. */
127 /* If true, perform translations. */
131 /* The following variables have valid values only when CONVERT is true: */
134 /* Column of next input character. */
135 uintmax_t column
= 0;
137 /* Column the next input tab stop is on. */
138 uintmax_t next_tab_column
= 0;
140 /* Index in TAB_LIST of next tab stop to examine. */
141 size_t tab_index
= 0;
143 /* If true, the first pending blank came just before a tab stop. */
144 bool one_blank_before_tab_stop
= false;
146 /* If true, the previous input character was a blank. This is
147 initially true, since initial strings of blanks are treated
148 as if the line was preceded by a blank. */
149 bool prev_blank
= true;
151 /* Number of pending columns of blanks. */
155 /* Convert a line of text. */
159 while ((c
= getc (fp
)) < 0 && (fp
= next_file (fp
)))
164 bool blank
= !! isblank (c
);
170 next_tab_column
= get_next_tab_column (column
, &tab_index
,
178 if (next_tab_column
< column
)
179 error (EXIT_FAILURE
, 0, _("input line is too long"));
183 column
= next_tab_column
;
186 pending_blank
[0] = '\t';
192 if (! (prev_blank
&& column
== next_tab_column
))
194 /* It is not yet known whether the pending blanks
195 will be replaced by tabs. */
196 if (column
== next_tab_column
)
197 one_blank_before_tab_stop
= true;
198 pending_blank
[pending
++] = c
;
203 /* Replace the pending blanks by a tab or two. */
204 pending_blank
[0] = c
= '\t';
207 /* Discard pending blanks, unless it was a single
208 blank just before the previous tab stop. */
209 pending
= one_blank_before_tab_stop
;
214 /* Go back one column, and force recalculation of the next tab stop. */
217 next_tab_column
= column
;
218 tab_index
-= !!tab_index
;
224 error (EXIT_FAILURE
, 0, _("input line is too long"));
229 if (pending
> 1 && one_blank_before_tab_stop
)
230 pending_blank
[0] = '\t';
231 if (fwrite (pending_blank
, 1, pending
, stdout
) != pending
)
234 one_blank_before_tab_stop
= false;
238 convert
&= convert_entire_line
|| blank
;
243 free (pending_blank
);
255 main (int argc
, char **argv
)
257 bool have_tabval
= false;
258 uintmax_t tabval
IF_LINT ( = 0);
261 /* If true, cancel the effect of any -a (explicit or implicit in -t),
262 so that only leading blanks will be considered. */
263 bool convert_first_only
= false;
265 initialize_main (&argc
, &argv
);
266 set_program_name (argv
[0]);
267 setlocale (LC_ALL
, "");
268 bindtextdomain (PACKAGE
, LOCALEDIR
);
269 textdomain (PACKAGE
);
271 atexit (close_stdout
);
273 while ((c
= getopt_long (argc
, argv
, ",0123456789at:", longopts
, nullptr))
279 usage (EXIT_FAILURE
);
281 convert_entire_line
= true;
284 convert_entire_line
= true;
285 parse_tab_stops (optarg
);
287 case CONVERT_FIRST_ONLY_OPTION
:
288 convert_first_only
= true;
292 add_tab_stop (tabval
);
295 case_GETOPT_HELP_CHAR
;
296 case_GETOPT_VERSION_CHAR (PROGRAM_NAME
, AUTHORS
);
303 if (!DECIMAL_DIGIT_ACCUMULATE (tabval
, c
- '0'))
304 error (EXIT_FAILURE
, 0, _("tab stop value is too large"));
309 if (convert_first_only
)
310 convert_entire_line
= false;
313 add_tab_stop (tabval
);
315 finalize_tab_stops ();
317 set_file_list ((optind
< argc
) ? &argv
[optind
] : nullptr);
321 cleanup_file_list_stdin ();