* NEWS: Add a line for 6.5-cvs.
[coreutils.git] / src / nl.c
blob7ee57b77d60e20901b9f4f6cf358427dc1a3a3b2
1 /* nl -- number lines of files
2 Copyright (C) 89, 92, 1995-2006 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software Foundation,
16 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
18 /* Written by Scott Bartram (nancy!scott@uunet.uu.net)
19 Revised by David MacKenzie (djm@gnu.ai.mit.edu) */
21 #include <config.h>
23 #include <stdio.h>
24 #include <sys/types.h>
25 #include <getopt.h>
27 #include "system.h"
29 #include <regex.h>
31 #include "error.h"
32 #include "linebuffer.h"
33 #include "quote.h"
34 #include "xstrtol.h"
/* Canonical program name handed to the --version handler; it never
   carries a `g' prefix, whatever the installed binary is called.  */
#define PROGRAM_NAME "nl"

/* Author list handed to the --version handler.  */
#define AUTHORS "Scott Bartram", "David MacKenzie"

/* printf templates for the prefix of a numbered line.  Each template
   consumes, in this order: an int field width, an intmax_t line
   number, and the separator string.  */

/* Number flush right, padded on the left with blanks.  */
static char const FORMAT_RIGHT_NOLZ[] = "%*" PRIdMAX "%s";

/* Number flush right, padded on the left with zeroes.  */
static char const FORMAT_RIGHT_LZ[] = "%0*" PRIdMAX "%s";

/* Number flush left, padded on the right with blanks.  */
static char const FORMAT_LEFT[] = "%-*" PRIdMAX "%s";

/* Section delimiter pair used when -d is not given: backslash, colon.  */
static char const DEFAULT_SECTION_DELIMITERS[] = "\\:";
/* Classification of one input line: a header, body, or footer
   section delimiter, or ordinary text to be written out.  */
enum section
{
  Header,
  Body,
  Footer,
  Text
};
63 /* The name this program was run with. */
64 char *program_name;
66 /* Format of body lines (-b). */
67 static char *body_type = "t";
69 /* Format of header lines (-h). */
70 static char *header_type = "n";
72 /* Format of footer lines (-f). */
73 static char *footer_type = "n";
75 /* Format currently being used (body, header, or footer). */
76 static char *current_type;
78 /* Regex for body lines to number (-bp). */
79 static struct re_pattern_buffer body_regex;
81 /* Regex for header lines to number (-hp). */
82 static struct re_pattern_buffer header_regex;
84 /* Regex for footer lines to number (-fp). */
85 static struct re_pattern_buffer footer_regex;
87 /* Fastmaps for the above. */
88 static char body_fastmap[UCHAR_MAX + 1];
89 static char header_fastmap[UCHAR_MAX + 1];
90 static char footer_fastmap[UCHAR_MAX + 1];
92 /* Pointer to current regex, if any. */
93 static struct re_pattern_buffer *current_regex = NULL;
95 /* Separator string to print after line number (-s). */
96 static char *separator_str = "\t";
98 /* Input section delimiter string (-d). */
99 static char const *section_del = DEFAULT_SECTION_DELIMITERS;
101 /* Header delimiter string. */
102 static char *header_del = NULL;
104 /* Header section delimiter length. */
105 static size_t header_del_len;
107 /* Body delimiter string. */
108 static char *body_del = NULL;
110 /* Body section delimiter length. */
111 static size_t body_del_len;
113 /* Footer delimiter string. */
114 static char *footer_del = NULL;
116 /* Footer section delimiter length. */
117 static size_t footer_del_len;
119 /* Input buffer. */
120 static struct linebuffer line_buf;
122 /* printf format string for unnumbered lines. */
123 static char *print_no_line_fmt = NULL;
125 /* Starting line number on each page (-v). */
126 static intmax_t starting_line_number = 1;
128 /* Line number increment (-i). */
129 static intmax_t page_incr = 1;
131 /* If true, reset line number at start of each page (-p). */
132 static bool reset_numbers = true;
134 /* Number of blank lines to consider to be one line for numbering (-l). */
135 static intmax_t blank_join = 1;
137 /* Width of line numbers (-w). */
138 static int lineno_width = 6;
140 /* Line number format (-n). */
141 static char const *lineno_format = FORMAT_RIGHT_NOLZ;
143 /* Current print line number. */
144 static intmax_t line_no;
146 /* True if we have ever read standard input. */
147 static bool have_read_stdin;
149 static struct option const longopts[] =
151 {"header-numbering", required_argument, NULL, 'h'},
152 {"body-numbering", required_argument, NULL, 'b'},
153 {"footer-numbering", required_argument, NULL, 'f'},
154 {"starting-line-number", required_argument, NULL, 'v'},
155 {"page-increment", required_argument, NULL, 'i'},
156 {"no-renumber", no_argument, NULL, 'p'},
157 {"join-blank-lines", required_argument, NULL, 'l'},
158 {"number-separator", required_argument, NULL, 's'},
159 {"number-width", required_argument, NULL, 'w'},
160 {"number-format", required_argument, NULL, 'n'},
161 {"section-delimiter", required_argument, NULL, 'd'},
162 {GETOPT_HELP_OPTION_DECL},
163 {GETOPT_VERSION_OPTION_DECL},
164 {NULL, 0, NULL, 0}
167 /* Print a usage message and quit. */
169 void
170 usage (int status)
172 if (status != EXIT_SUCCESS)
173 fprintf (stderr, _("Try `%s --help' for more information.\n"),
174 program_name);
175 else
177 printf (_("\
178 Usage: %s [OPTION]... [FILE]...\n\
180 program_name);
181 fputs (_("\
182 Write each FILE to standard output, with line numbers added.\n\
183 With no FILE, or when FILE is -, read standard input.\n\
185 "), stdout);
186 fputs (_("\
187 Mandatory arguments to long options are mandatory for short options too.\n\
188 "), stdout);
189 fputs (_("\
190 -b, --body-numbering=STYLE use STYLE for numbering body lines\n\
191 -d, --section-delimiter=CC use CC for separating logical pages\n\
192 -f, --footer-numbering=STYLE use STYLE for numbering footer lines\n\
193 "), stdout);
194 fputs (_("\
195 -h, --header-numbering=STYLE use STYLE for numbering header lines\n\
196 -i, --page-increment=NUMBER line number increment at each line\n\
197 -l, --join-blank-lines=NUMBER group of NUMBER empty lines counted as one\n\
198 -n, --number-format=FORMAT insert line numbers according to FORMAT\n\
199 -p, --no-renumber do not reset line numbers at logical pages\n\
200 -s, --number-separator=STRING add STRING after (possible) line number\n\
201 "), stdout);
202 fputs (_("\
203 -v, --first-page=NUMBER first line number on each logical page\n\
204 -w, --number-width=NUMBER use NUMBER columns for line numbers\n\
205 "), stdout);
206 fputs (HELP_OPTION_DESCRIPTION, stdout);
207 fputs (VERSION_OPTION_DESCRIPTION, stdout);
208 fputs (_("\
210 By default, selects -v1 -i1 -l1 -sTAB -w6 -nrn -hn -bt -fn. CC are\n\
211 two delimiter characters for separating logical pages, a missing\n\
212 second character implies :. Type \\\\ for \\. STYLE is one of:\n\
213 "), stdout);
214 fputs (_("\
216 a number all lines\n\
217 t number only nonempty lines\n\
218 n number no lines\n\
219 pBRE number only lines that contain a match for the basic regular\n\
220 expression, BRE\n\
222 FORMAT is one of:\n\
224 ln left justified, no leading zeros\n\
225 rn right justified, no leading zeros\n\
226 rz right justified, leading zeros\n\
228 "), stdout);
229 printf (_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
231 exit (status);
234 /* Set the command line flag TYPEP and possibly the regex pointer REGEXP,
235 according to `optarg'. */
237 static bool
238 build_type_arg (char **typep, struct re_pattern_buffer *regexp, char *fastmap)
240 const char *errmsg;
241 bool rval = true;
243 switch (*optarg)
245 case 'a':
246 case 't':
247 case 'n':
248 *typep = optarg;
249 break;
250 case 'p':
251 *typep = optarg++;
252 regexp->buffer = NULL;
253 regexp->allocated = 0;
254 regexp->fastmap = fastmap;
255 regexp->translate = NULL;
256 re_syntax_options =
257 RE_SYNTAX_POSIX_BASIC & ~RE_CONTEXT_INVALID_DUP & ~RE_NO_EMPTY_RANGES;
258 errmsg = re_compile_pattern (optarg, strlen (optarg), regexp);
259 if (errmsg)
260 error (EXIT_FAILURE, 0, "%s", errmsg);
261 break;
262 default:
263 rval = false;
264 break;
266 return rval;
269 /* Print the line number and separator; increment the line number. */
271 static void
272 print_lineno (void)
274 intmax_t next_line_no;
276 printf (lineno_format, lineno_width, line_no, separator_str);
278 next_line_no = line_no + page_incr;
279 if (next_line_no < line_no)
280 error (EXIT_FAILURE, 0, _("line number overflow"));
281 line_no = next_line_no;
284 /* Switch to a header section. */
286 static void
287 proc_header (void)
289 current_type = header_type;
290 current_regex = &header_regex;
291 if (reset_numbers)
292 line_no = starting_line_number;
293 putchar ('\n');
296 /* Switch to a body section. */
298 static void
299 proc_body (void)
301 current_type = body_type;
302 current_regex = &body_regex;
303 putchar ('\n');
306 /* Switch to a footer section. */
308 static void
309 proc_footer (void)
311 current_type = footer_type;
312 current_regex = &footer_regex;
313 putchar ('\n');
316 /* Process a regular text line in `line_buf'. */
318 static void
319 proc_text (void)
321 static intmax_t blank_lines = 0; /* Consecutive blank lines so far. */
323 switch (*current_type)
325 case 'a':
326 if (blank_join > 1)
328 if (1 < line_buf.length || ++blank_lines == blank_join)
330 print_lineno ();
331 blank_lines = 0;
333 else
334 fputs (print_no_line_fmt, stdout);
336 else
337 print_lineno ();
338 break;
339 case 't':
340 if (1 < line_buf.length)
341 print_lineno ();
342 else
343 fputs (print_no_line_fmt, stdout);
344 break;
345 case 'n':
346 fputs (print_no_line_fmt, stdout);
347 break;
348 case 'p':
349 switch (re_search (current_regex, line_buf.buffer, line_buf.length - 1,
350 0, line_buf.length - 1, (struct re_registers *) 0))
352 case -2:
353 error (EXIT_FAILURE, errno, _("error in regular expression search"));
355 case -1:
356 fputs (print_no_line_fmt, stdout);
357 break;
359 default:
360 print_lineno ();
361 break;
364 fwrite (line_buf.buffer, sizeof (char), line_buf.length, stdout);
367 /* Return the type of line in `line_buf'. */
369 static enum section
370 check_section (void)
372 size_t len = line_buf.length - 1;
374 if (len < 2 || memcmp (line_buf.buffer, section_del, 2))
375 return Text;
376 if (len == header_del_len
377 && !memcmp (line_buf.buffer, header_del, header_del_len))
378 return Header;
379 if (len == body_del_len
380 && !memcmp (line_buf.buffer, body_del, body_del_len))
381 return Body;
382 if (len == footer_del_len
383 && !memcmp (line_buf.buffer, footer_del, footer_del_len))
384 return Footer;
385 return Text;
388 /* Read and process the file pointed to by FP. */
390 static void
391 process_file (FILE *fp)
393 while (readlinebuffer (&line_buf, fp))
395 switch (check_section ())
397 case Header:
398 proc_header ();
399 break;
400 case Body:
401 proc_body ();
402 break;
403 case Footer:
404 proc_footer ();
405 break;
406 case Text:
407 proc_text ();
408 break;
413 /* Process file FILE to standard output.
414 Return true if successful. */
416 static bool
417 nl_file (const char *file)
419 FILE *stream;
421 if (STREQ (file, "-"))
423 have_read_stdin = true;
424 stream = stdin;
426 else
428 stream = fopen (file, "r");
429 if (stream == NULL)
431 error (0, errno, "%s", file);
432 return false;
436 process_file (stream);
438 if (ferror (stream))
440 error (0, errno, "%s", file);
441 return false;
443 if (STREQ (file, "-"))
444 clearerr (stream); /* Also clear EOF. */
445 else if (fclose (stream) == EOF)
447 error (0, errno, "%s", file);
448 return false;
450 return true;
454 main (int argc, char **argv)
456 int c;
457 size_t len;
458 bool ok = true;
460 initialize_main (&argc, &argv);
461 program_name = argv[0];
462 setlocale (LC_ALL, "");
463 bindtextdomain (PACKAGE, LOCALEDIR);
464 textdomain (PACKAGE);
466 atexit (close_stdout);
468 have_read_stdin = false;
470 while ((c = getopt_long (argc, argv, "h:b:f:v:i:pl:s:w:n:d:", longopts,
471 NULL)) != -1)
473 switch (c)
475 case 'h':
476 if (! build_type_arg (&header_type, &header_regex, header_fastmap))
478 error (0, 0, _("invalid header numbering style: %s"),
479 quote (optarg));
480 ok = false;
482 break;
483 case 'b':
484 if (! build_type_arg (&body_type, &body_regex, body_fastmap))
486 error (0, 0, _("invalid body numbering style: %s"),
487 quote (optarg));
488 ok = false;
490 break;
491 case 'f':
492 if (! build_type_arg (&footer_type, &footer_regex, footer_fastmap))
494 error (0, 0, _("invalid footer numbering style: %s"),
495 quote (optarg));
496 ok = false;
498 break;
499 case 'v':
500 if (xstrtoimax (optarg, NULL, 10, &starting_line_number, "")
501 != LONGINT_OK)
503 error (0, 0, _("invalid starting line number: %s"),
504 quote (optarg));
505 ok = false;
507 break;
508 case 'i':
509 if (! (xstrtoimax (optarg, NULL, 10, &page_incr, "") == LONGINT_OK
510 && 0 < page_incr))
512 error (0, 0, _("invalid line number increment: %s"),
513 quote (optarg));
514 ok = false;
516 break;
517 case 'p':
518 reset_numbers = false;
519 break;
520 case 'l':
521 if (! (xstrtoimax (optarg, NULL, 10, &blank_join, "") == LONGINT_OK
522 && 0 < blank_join))
524 error (0, 0, _("invalid number of blank lines: %s"),
525 quote (optarg));
526 ok = false;
528 break;
529 case 's':
530 separator_str = optarg;
531 break;
532 case 'w':
534 long int tmp_long;
535 if (xstrtol (optarg, NULL, 10, &tmp_long, "") != LONGINT_OK
536 || tmp_long <= 0 || tmp_long > INT_MAX)
538 error (0, 0, _("invalid line number field width: %s"),
539 quote (optarg));
540 ok = false;
542 else
544 lineno_width = tmp_long;
547 break;
548 case 'n':
549 if (STREQ (optarg, "ln"))
550 lineno_format = FORMAT_LEFT;
551 else if (STREQ (optarg, "rn"))
552 lineno_format = FORMAT_RIGHT_NOLZ;
553 else if (STREQ (optarg, "rz"))
554 lineno_format = FORMAT_RIGHT_LZ;
555 else
557 error (0, 0, _("invalid line numbering format: %s"),
558 quote (optarg));
559 ok = false;
561 break;
562 case 'd':
563 section_del = optarg;
564 break;
565 case_GETOPT_HELP_CHAR;
566 case_GETOPT_VERSION_CHAR (PROGRAM_NAME, AUTHORS);
567 default:
568 ok = false;
569 break;
573 if (!ok)
574 usage (EXIT_FAILURE);
576 /* Initialize the section delimiters. */
577 len = strlen (section_del);
579 header_del_len = len * 3;
580 header_del = xmalloc (header_del_len + 1);
581 strcat (strcat (strcpy (header_del, section_del), section_del), section_del);
583 body_del_len = len * 2;
584 body_del = xmalloc (body_del_len + 1);
585 strcat (strcpy (body_del, section_del), section_del);
587 footer_del_len = len;
588 footer_del = xmalloc (footer_del_len + 1);
589 strcpy (footer_del, section_del);
591 /* Initialize the input buffer. */
592 initbuffer (&line_buf);
594 /* Initialize the printf format for unnumbered lines. */
595 len = strlen (separator_str);
596 print_no_line_fmt = xmalloc (lineno_width + len + 1);
597 memset (print_no_line_fmt, ' ', lineno_width + len);
598 print_no_line_fmt[lineno_width + len] = '\0';
600 line_no = starting_line_number;
601 current_type = body_type;
602 current_regex = &body_regex;
604 /* Main processing. */
606 if (optind == argc)
607 ok = nl_file ("-");
608 else
609 for (; optind < argc; optind++)
610 ok &= nl_file (argv[optind]);
612 if (have_read_stdin && fclose (stdin) == EOF)
613 error (EXIT_FAILURE, errno, "-");
615 exit (ok ? EXIT_SUCCESS : EXIT_FAILURE);