1 /* tac - concatenate and print files in reverse
2 Copyright (C) 1988, 1989, 1990, 1991, 1995 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* Written by Jay Lepreau (lepreau@cs.utah.edu).
19 GNU enhancements by David MacKenzie (djm@gnu.ai.mit.edu). */
21 /* Copy each FILE, or the standard input if none are given or when a
22 FILE name of "-" is encountered, to the standard output with the
23 order of the records reversed. The records are separated by
24 instances of a string, or a newline if none is given. By default, the
25 separator string is attached to the end of the record that it follows in the file.
29 -b, --before The separator is attached to the beginning
30 of the record that it precedes in the file.
31 -r, --regex The separator is a regular expression.
32 -s, --separator=separator Use SEPARATOR as the record separator.
34 To reverse a file byte by byte, use (in bash, ksh, or sh):
42 #include <sys/types.h>
58 #ifndef DEFAULT_TMPDIR
59 #define DEFAULT_TMPDIR "/tmp"
62 /* The number of bytes per atomic read. */
63 #define INITIAL_READSIZE 8192
65 /* The number of bytes per atomic write. */
66 #define WRITESIZE 8192
73 /* The name this program was run with. */
76 /* The string that separates the records of the file. */
77 static char *separator
;
79 /* If nonzero, print `separator' along with the record preceding it
80 in the file; otherwise with the record following it. */
81 static int separator_ends_record
;
83 /* 0 if `separator' is to be matched as a regular expression;
84 otherwise, the length of `separator', used as a sentinel to stop the search. */
86 static int sentinel_length
;
88 /* The length of a match with `separator'. If `sentinel_length' is 0,
89 `match_length' is computed every time a match succeeds;
90 otherwise, it is simply the length of `separator'. */
91 static int match_length
;
93 /* The input buffer. */
96 /* The number of bytes to read at once into `buffer'. */
97 static unsigned read_size
;
99 /* The size of `buffer'. This is read_size * 2 + sentinel_length + 2.
100 The extra 2 bytes allow `past_end' to have a value beyond the
101 end of `buffer' and `match_start' to run off the front of `buffer'. */
102 static unsigned buffer_size
;
104 /* The compiled regular expression representing `separator'. */
105 static struct re_pattern_buffer compiled_separator
;
107 /* The name of a temporary file containing a copy of pipe input. */
108 static char *tempfile
;
110 /* If nonzero, display usage information and exit. */
111 static int show_help
;
113 /* If nonzero, print the version on standard output then exit. */
114 static int show_version
;
116 static struct option
const longopts
[] =
118 {"before", no_argument
, &separator_ends_record
, 0},
119 {"regex", no_argument
, &sentinel_length
, 0},
120 {"separator", required_argument
, NULL
, 's'},
121 {"help", no_argument
, &show_help
, 1},
122 {"version", no_argument
, &show_version
, 1},
130 fprintf (stderr
, _("Try `%s --help' for more information.\n"),
135 Usage: %s [OPTION]... [FILE]...\n\
139 Write each FILE to standard output, last line first.\n\
140 With no FILE, or when FILE is -, read standard input.\n\
142 -b, --before attach the separator before instead of after\n\
143 -r, --regex interpret the separator as a regular expression\n\
144 -s, --separator=STRING use STRING as the separator instead of newline\n\
145 --help display this help and exit\n\
146 --version output version information and exit\n\
169 struct sigaction sigact
;
171 sigact
.sa_handler
= SIG_DFL
;
172 sigemptyset (&sigact
.sa_mask
);
174 sigaction (sig
, &sigact
, NULL
);
175 #else /* !SA_INTERRUPT */
176 signal (sig
, SIG_DFL
);
177 #endif /* SA_INTERRUPT */
179 kill (getpid (), sig
);
182 /* Allocate N bytes of memory dynamically, with error checking. */
185 xmalloc (unsigned int n
)
192 error (0, 0, _("virtual memory exhausted"));
198 /* Change the size of memory area P to N bytes, with error checking. */
201 xrealloc (char *p
, unsigned int n
)
206 error (0, 0, _("virtual memory exhausted"));
213 xwrite (int desc
, const char *buffer
, int size
)
215 if (full_write (desc
, buffer
, size
) < 0)
217 error (0, errno
, _("write error"));
222 /* Print the characters from START to PAST_END - 1.
223 If START is NULL, just flush the buffer. */
226 output (const char *start
, const char *past_end
)
228 static char buffer
[WRITESIZE
];
229 static int bytes_in_buffer
= 0;
230 int bytes_to_add
= past_end
- start
;
231 int bytes_available
= WRITESIZE
- bytes_in_buffer
;
235 xwrite (STDOUT_FILENO
, buffer
, bytes_in_buffer
);
240 /* Write out as many full buffers as possible. */
241 while (bytes_to_add
>= bytes_available
)
243 memcpy (buffer
+ bytes_in_buffer
, start
, bytes_available
);
244 bytes_to_add
-= bytes_available
;
245 start
+= bytes_available
;
246 xwrite (STDOUT_FILENO
, buffer
, WRITESIZE
);
248 bytes_available
= WRITESIZE
;
251 memcpy (buffer
+ bytes_in_buffer
, start
, bytes_to_add
);
252 bytes_in_buffer
+= bytes_to_add
;
255 /* Print in reverse the file open on descriptor FD for reading FILE.
256 Return 0 if ok, 1 if an error occurs. */
259 tac (int fd
, const char *file
)
261 /* Pointer to the location in `buffer' where the search for
262 the next separator will begin. */
264 /* Pointer to one past the rightmost character in `buffer' that
265 has not been printed yet. */
267 unsigned saved_record_size
; /* Length of the record growing in `buffer'. */
268 off_t file_pos
; /* Offset in the file of the next read. */
269 /* Nonzero if `output' has not been called yet for any file.
270 Only used when the separator is attached to the preceding record. */
272 char first_char
= *separator
; /* Speed optimization, non-regexp. */
273 char *separator1
= separator
+ 1; /* Speed optimization, non-regexp. */
274 int match_length1
= match_length
- 1; /* Speed optimization, non-regexp. */
275 struct re_registers regs
;
277 /* Find the size of the input file. */
278 file_pos
= lseek (fd
, (off_t
) 0, SEEK_END
);
280 return 0; /* It's an empty file. */
282 /* Arrange for the first read to lop off enough to leave the rest of the
283 file a multiple of `read_size'. Since `read_size' can change, this may
284 not always hold during the program run, but since it usually will, leave
285 it here for i/o efficiency (page/sector boundaries and all that).
286 Note: the efficiency gain has not been verified. */
287 saved_record_size
= file_pos
% read_size
;
288 if (saved_record_size
== 0)
289 saved_record_size
= read_size
;
290 file_pos
-= saved_record_size
;
291 /* `file_pos' now points to the start of the last (probably partial) block
292 in the input file. */
294 lseek (fd
, file_pos
, SEEK_SET
);
295 if (safe_read (fd
, buffer
, saved_record_size
) != saved_record_size
)
297 error (0, errno
, "%s", file
);
301 match_start
= past_end
= buffer
+ saved_record_size
;
302 /* For non-regexp search, move past impossible positions for a match. */
304 match_start
-= match_length1
;
308 /* Search backward from `match_start' - 1 to `buffer' for a match
309 with `separator'; for speed, use strncmp if `separator' contains no metacharacters.
311 If the match succeeds, set `match_start' to point to the start of
312 the match and `match_length' to the length of the match.
313 Otherwise, make `match_start' < `buffer'. */
314 if (sentinel_length
== 0)
316 int i
= match_start
- buffer
;
319 ret
= re_search (&compiled_separator
, buffer
, i
, i
- 1, -i
, &regs
);
321 match_start
= buffer
- 1;
324 error (0, 0, _("error in regular expression search"));
329 match_start
= buffer
+ regs
.start
[0];
330 match_length
= regs
.end
[0] - regs
.start
[0];
335 /* `match_length' is constant for non-regexp boundaries. */
336 while (*--match_start
!= first_char
337 || (match_length1
&& strncmp (match_start
+ 1, separator1
,
342 /* Check whether we backed off the front of `buffer' without finding
343 a match for `separator'. */
344 if (match_start
< buffer
)
348 /* Hit the beginning of the file; print the remaining record. */
349 output (buffer
, past_end
);
353 saved_record_size
= past_end
- buffer
;
354 if (saved_record_size
> read_size
)
356 /* `buffer_size' is about twice `read_size', so since
357 we want to read in another `read_size' bytes before
358 the data already in `buffer', we need to increase `buffer_size'. */
361 int offset
= sentinel_length
? sentinel_length
: 1;
364 buffer_size
= read_size
* 2 + sentinel_length
+ 2;
365 newbuffer
= xrealloc (buffer
- offset
, buffer_size
) + offset
;
366 /* Adjust the pointers for the new buffer location. */
367 match_start
+= newbuffer
- buffer
;
368 past_end
+= newbuffer
- buffer
;
372 /* Back up to the start of the next bufferfull of the file. */
373 if (file_pos
>= read_size
)
374 file_pos
-= read_size
;
377 read_size
= file_pos
;
380 lseek (fd
, file_pos
, SEEK_SET
);
382 /* Shift the pending record data right to make room for the new.
383 The source and destination regions probably overlap. */
384 memmove (buffer
+ read_size
, buffer
, saved_record_size
);
385 past_end
= buffer
+ read_size
+ saved_record_size
;
386 /* For non-regexp searches, avoid unnecessary scanning. */
388 match_start
= buffer
+ read_size
;
390 match_start
= past_end
;
392 if (safe_read (fd
, buffer
, read_size
) != read_size
)
394 error (0, errno
, "%s", file
);
400 /* Found a match of `separator'. */
401 if (separator_ends_record
)
403 char *match_end
= match_start
+ match_length
;
405 /* If this match of `separator' isn't at the end of the
406 file, print the record. */
407 if (first_time
== 0 || match_end
!= past_end
)
408 output (match_end
, past_end
);
409 past_end
= match_end
;
414 output (match_start
, past_end
);
415 past_end
= match_start
;
417 match_start
-= match_length
- 1;
422 /* Print FILE in reverse.
423 Return 0 if ok, 1 if an error occurs. */
426 tac_file (const char *file
)
430 fd
= open (file
, O_RDONLY
);
433 error (0, errno
, "%s", file
);
436 errors
= tac (fd
, file
);
439 error (0, errno
, "%s", file
);
445 /* Make a copy of the standard input in `tempfile'. */
450 static char *template = NULL
;
451 static char *tempdir
;
455 if (template == NULL
)
457 tempdir
= getenv ("TMPDIR");
459 tempdir
= DEFAULT_TMPDIR
;
460 template = xmalloc (strlen (tempdir
) + 11);
462 sprintf (template, "%s/tacXXXXXX", tempdir
);
463 tempfile
= mktemp (template);
465 fd
= creat (tempfile
, 0600);
468 error (0, errno
, "%s", tempfile
);
471 while ((bytes_read
= safe_read (0, buffer
, read_size
)) > 0)
472 if (full_write (fd
, buffer
, bytes_read
) < 0)
474 error (0, errno
, "%s", tempfile
);
479 error (0, errno
, "%s", tempfile
);
482 if (bytes_read
== -1)
484 error (0, errno
, _("read error"));
489 /* Print the standard input in reverse, saving it to temporary
490 file `tempfile' first if it is a pipe.
491 Return 0 if ok, 1 if an error occurs. */
496 /* Previous values of signal handlers. */
497 RETSIGTYPE (*sigint
) (), (*sighup
) (), (*sigpipe
) (), (*sigterm
) ();
501 struct sigaction oldact
, newact
;
502 #endif /* SA_INTERRUPT */
504 /* No tempfile is needed for "tac < file".
505 Use fstat instead of checking for errno == ESPIPE because
506 lseek doesn't work on some special files but doesn't return an error, either. */
508 if (fstat (0, &stats
))
510 error (0, errno
, _("standard input"));
513 if (S_ISREG (stats
.st_mode
))
514 return tac (0, _("standard input"));
517 newact
.sa_handler
= sighandler
;
518 sigemptyset (&newact
.sa_mask
);
521 sigaction (SIGINT
, NULL
, &oldact
);
522 sigint
= oldact
.sa_handler
;
523 if (sigint
!= SIG_IGN
)
524 sigaction (SIGINT
, &newact
, NULL
);
526 sigaction (SIGHUP
, NULL
, &oldact
);
527 sighup
= oldact
.sa_handler
;
528 if (sighup
!= SIG_IGN
)
529 sigaction (SIGHUP
, &newact
, NULL
);
531 sigaction (SIGPIPE
, NULL
, &oldact
);
532 sigpipe
= oldact
.sa_handler
;
533 if (sigpipe
!= SIG_IGN
)
534 sigaction (SIGPIPE
, &newact
, NULL
);
536 sigaction (SIGTERM
, NULL
, &oldact
);
537 sigterm
= oldact
.sa_handler
;
538 if (sigterm
!= SIG_IGN
)
539 sigaction (SIGTERM
, &newact
, NULL
);
540 #else /* !SA_INTERRUPT */
541 sigint
= signal (SIGINT
, SIG_IGN
);
542 if (sigint
!= SIG_IGN
)
543 signal (SIGINT
, sighandler
);
545 sighup
= signal (SIGHUP
, SIG_IGN
);
546 if (sighup
!= SIG_IGN
)
547 signal (SIGHUP
, sighandler
);
549 sigpipe
= signal (SIGPIPE
, SIG_IGN
);
550 if (sigpipe
!= SIG_IGN
)
551 signal (SIGPIPE
, sighandler
);
553 sigterm
= signal (SIGTERM
, SIG_IGN
);
554 if (sigterm
!= SIG_IGN
)
555 signal (SIGTERM
, sighandler
);
556 #endif /* SA_INTERRUPT */
560 errors
= tac_file (tempfile
);
565 newact
.sa_handler
= sigint
;
566 sigaction (SIGINT
, &newact
, NULL
);
567 newact
.sa_handler
= sighup
;
568 sigaction (SIGHUP
, &newact
, NULL
);
569 newact
.sa_handler
= sigterm
;
570 sigaction (SIGTERM
, &newact
, NULL
);
571 newact
.sa_handler
= sigpipe
;
572 sigaction (SIGPIPE
, &newact
, NULL
);
573 #else /* !SA_INTERRUPT */
574 signal (SIGINT
, sigint
);
575 signal (SIGHUP
, sighup
);
576 signal (SIGTERM
, sigterm
);
577 signal (SIGPIPE
, sigpipe
);
578 #endif /* SA_INTERRUPT */
584 main (int argc
, char **argv
)
586 const char *error_message
; /* Return value from re_compile_pattern. */
588 int have_read_stdin
= 0;
590 program_name
= argv
[0];
591 setlocale (LC_ALL
, "");
592 bindtextdomain (PACKAGE
, LOCALEDIR
);
593 textdomain (PACKAGE
);
598 separator_ends_record
= 1;
600 while ((optc
= getopt_long (argc
, argv
, "brs:", longopts
, (int *) 0))
608 separator_ends_record
= 0;
616 error (1, 0, _("separator cannot be empty"));
625 printf ("tac - %s\n", version_string
);
632 if (sentinel_length
== 0)
634 compiled_separator
.allocated
= 100;
635 compiled_separator
.buffer
= (unsigned char *)
636 xmalloc (compiled_separator
.allocated
);
637 compiled_separator
.fastmap
= xmalloc (256);
638 compiled_separator
.translate
= 0;
639 error_message
= re_compile_pattern (separator
, strlen (separator
),
640 &compiled_separator
);
642 error (1, 0, "%s", error_message
);
645 match_length
= sentinel_length
= strlen (separator
);
647 read_size
= INITIAL_READSIZE
;
648 /* A precaution that will probably never be needed. */
649 while (sentinel_length
* 2 >= read_size
)
651 buffer_size
= read_size
* 2 + sentinel_length
+ 2;
652 buffer
= xmalloc (buffer_size
);
655 strcpy (buffer
, separator
);
656 buffer
+= sentinel_length
;
664 errors
= tac_stdin ();
667 for (; optind
< argc
; ++optind
)
669 if (strcmp (argv
[optind
], "-") == 0)
672 errors
|= tac_stdin ();
675 errors
|= tac_file (argv
[optind
]);
678 /* Flush the output buffer. */
679 output ((char *) NULL
, (char *) NULL
);
681 if (have_read_stdin
&& close (0) < 0)
682 error (1, errno
, "-");
684 error (1, errno
, _("write error"));