1 /* $NetBSD: sort.h,v 1.34 2011/09/16 15:39:29 joerg Exp $ */
4 * Copyright (c) 2000-2003 The NetBSD Foundation, Inc.
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Ben Harris and Jaromir Dolecek.
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
34 * The Regents of the University of California. All rights reserved.
36 * This code is derived from software contributed to Berkeley by
39 * Redistribution and use in source and binary forms, with or without
40 * modification, are permitted provided that the following conditions
42 * 1. Redistributions of source code must retain the above copyright
43 * notice, this list of conditions and the following disclaimer.
44 * 2. Redistributions in binary form must reproduce the above copyright
45 * notice, this list of conditions and the following disclaimer in the
46 * documentation and/or other materials provided with the distribution.
47 * 3. Neither the name of the University nor the names of its contributors
48 * may be used to endorse or promote products derived from this software
49 * without specific prior written permission.
51 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
52 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
53 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
54 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
55 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
56 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
57 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
58 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
59 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
60 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
63 * @(#)sort.h 8.1 (Berkeley) 6/6/93
66 #include <sys/param.h>
/*
 * Per-field option bits (masks, weights and other flags).
 * The two lowest bits, R and F, also serve as the index into
 * weight_tables[].
 */
#define R	(1 << 0)	/* field is reversed */
#define F	(1 << 1)	/* weight lower and upper case the same */
#define I	(1 << 2)	/* mask out non-printable characters */
#define D	(1 << 3)	/* sort alphanumeric characters only */
#define N	(1 << 4)	/* field is a number */
#define BI	(1 << 5)	/* ignore blanks in icol */
#define BT	(1 << 6)	/* ignore blanks in tcol */
#define L	(1 << 7)	/* sort by field length */
#define X	(1 << 8)	/* field is a hex number */
/* Delimiter class bits: blanks, field separators and record terminators. */
#define BLANK	(1 << 0)	/* ' ', '\t'; '\n' if -R is invoked */
#define FLD_D	(1 << 1)	/* ' ', '\t' default; from -t otherwise */
#define REC_D_F	(1 << 2)	/* '\n' default; from -R otherwise */
/*
 * Two-argument minimum and maximum.
 * These are plain macros: the selected argument is evaluated a second
 * time, so do not pass expressions with side effects.
 */
#define min(a, b)	(((a) < (b)) ? (a) : (b))
#define max(a, b)	(((a) > (b)) ? (a) : (b))
101 #define FCLOSE(file) { \
102 if (EOF == fclose(file)) \
103 err(2, "%p", file); \
106 #define EWRITE(ptr, size, n, f) { \
107 if (!fwrite(ptr, size, n, f)) \
111 /* Records are limited to MAXBUFSIZE (8MB) and less if you want to sort
113 * Anyone who wants to sort data records longer than 2GB definitely needs a
114 * different program! */
/*
 * Unsigned type for record sizes: used for the length and offset members
 * of a record header and as the return type of enterkey().
 */
typedef unsigned int length_t;
117 /* A record is a key/line pair starting at rec.data. It has a total length
118 * and an offset to the start of the line half of the pair.
120 typedef struct recheader
{
121 length_t length
; /* total length of key and line */
122 length_t offset
; /* to line */
123 int keylen
; /* length of key */
124 u_char data
[]; /* key then line */
127 /* This is the column as seen by struct field. It is used by enterfield.
128 * They are matched with corresponding coldescs during initialization.
136 /* a coldesc has a number and pointers to the beginning and end of the
137 * corresponding column in the current line. This is determined in enterkey.
139 typedef struct coldesc
{
145 /* A field has an initial and final column; an omitted final column
146 * implies the end of the line. Flags regulate omission of blanks and
147 * numerical sorts; mask determines which characters are ignored (from -i, -d);
148 * weights determines the sort weights of a character (from -f, -r).
150 * The first field contains the global flags etc.
151 * The list terminates when icol = 0.
162 const char * const * names
;
165 typedef int (*get_func_t
)(FILE *, RECHEADER
*, u_char
*, struct field
*);
166 typedef void (*put_func_t
)(const RECHEADER
*, FILE *);
168 extern u_char ascii
[NBINS
], Rascii
[NBINS
], Ftable
[NBINS
], RFtable
[NBINS
];
169 extern u_char
*const weight_tables
[4]; /* ascii, Rascii, Ftable, RFtable */
170 extern u_char d_mask
[NBINS
];
171 extern int SINGL_FLD
, SEP_FLAG
, UNIQUE
, REVERSE
;
172 extern int posix_sort
;
174 extern const char *tmpdir
;
175 extern struct coldesc
*clist
;
/*
 * DEBUG(ch) yields a non-zero value when the bit of debug_flags selected
 * by the low five bits of ch is set, and zero otherwise.
 *
 * The shifted constant is unsigned: with a plain int 1, selecting bit 31
 * would shift into the sign bit, which is undefined behavior in C.
 */
#define DEBUG(ch)	(debug_flags & (1U << ((ch) & 31)))
extern unsigned int debug_flags;
181 RECHEADER
*allocrec(RECHEADER
*, size_t);
182 void append(RECHEADER
**, int, FILE *, void (*)(const RECHEADER
*, FILE *));
183 void concat(FILE *, FILE *);
184 length_t
enterkey(RECHEADER
*, const u_char
*, u_char
*, size_t, struct field
*);
185 void fixit(int *, char **, const char *);
186 void fldreset(struct field
*);
188 void fmerge(struct filelist
*, int, FILE *, struct field
*);
189 void save_for_merge(FILE *, get_func_t
, struct field
*);
190 void merge_sort(FILE *, put_func_t
, struct field
*);
191 void fsort(struct filelist
*, int, FILE *, struct field
*);
192 int geteasy(FILE *, RECHEADER
*, u_char
*, struct field
*);
193 int makekey(FILE *, RECHEADER
*, u_char
*, struct field
*);
194 int makeline(FILE *, RECHEADER
*, u_char
*, struct field
*);
195 void makeline_copydown(RECHEADER
*);
196 int optval(int, int);
197 __dead
void order(struct filelist
*, struct field
*);
198 void putline(const RECHEADER
*, FILE *);
199 void putrec(const RECHEADER
*, FILE *);
200 void putkeydump(const RECHEADER
*, FILE *);
201 void rd_append(int, int, int, FILE *, u_char
*, u_char
*);
202 void radix_sort(RECHEADER
**, RECHEADER
**, int);
203 int setfield(const char *, struct field
*, int);
204 void settables(void);