1 /* $NetBSD: merge.c,v 1.12 2009/02/12 03:12:36 lukem Exp $ */
4 * Copyright (c) 1992, 1993
5 * The Regents of the University of California. All rights reserved.
7 * This code is derived from software contributed to Berkeley by
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. Neither the name of the University nor the names of its contributors
19 * may be used to endorse or promote products derived from this software
20 * without specific prior written permission.
22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
35 #include <sys/cdefs.h>
36 #if defined(LIBC_SCCS) && !defined(lint)
38 static char sccsid
[] = "from: @(#)merge.c 8.2 (Berkeley) 2/14/94";
40 __RCSID("$NetBSD: merge.c,v 1.12 2009/02/12 03:12:36 lukem Exp $");
42 #endif /* LIBC_SCCS and not lint */
45 * Hybrid exponential search/linear search merge sort with hybrid
46 * natural/pairwise first pass. Requires about .3% more comparisons
47 * for random data than LSMS with pairwise first pass alone.
48 * It works for objects as small as two bytes.
52 #define THRESHOLD 16 /* Best choice for natural merge cut-off. */
54 /* #define NATURAL to get hybrid natural merge.
55 * (The default is pairwise merging.)
#include "namespace.h"
#include <sys/types.h>

#include <assert.h>
#include <errno.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
67 __weak_alias(mergesort
,_mergesort
)
70 static void setup
__P((u_char
*, u_char
*, size_t, size_t,
71 int (*)(const void *, const void *)));
72 static void insertionsort
__P((u_char
*, size_t, size_t,
73 int (*)(const void *, const void *)));
75 #define ISIZE sizeof(int)
76 #define PSIZE sizeof(u_char *)
77 #define ICOPY_LIST(src, dst, last) \
79 *(int*)(void *)dst = *(int*)(void *)src, \
80 src += ISIZE, dst += ISIZE; \
82 #define ICOPY_ELT(src, dst, i) \
84 *(int*)(void *)dst = *(int*)(void *)src, \
85 src += ISIZE, dst += ISIZE; \
88 #define CCOPY_LIST(src, dst, last) \
92 #define CCOPY_ELT(src, dst, i) \
/*
 * Find the next possible pointer head.  (Trickery for forcing an array
 * to do double duty as a linked list when objects do not align with word
 * boundaries.)
 */
/*
 * EVAL(p): round the address p up to the next multiple of PSIZE and view
 * the result as a pointer slot (u_char **).
 *
 * Assumption: PSIZE is a power of 2.
 *
 * The rounding is done on a uintptr_t value; forming the address by adding
 * to and subtracting from a null pointer is undefined behaviour in ISO C.
 */
#define EVAL(p) ((u_char **)(void *)					\
    (((uintptr_t)(void *)(p) + (uintptr_t)(PSIZE - 1)) &		\
    ~(uintptr_t)(PSIZE - 1)))
108 * Arguments are as for qsort.
111 mergesort(base
, nmemb
, size
, cmp
)
115 int (*cmp
) __P((const void *, const void *));
120 u_char
*f1
, *f2
, *t
, *b
, *tp2
, *q
, *l1
, *l2
;
121 u_char
*list2
, *list1
, *p2
, *p
, *last
, **p1
;
123 _DIAGASSERT(base
!= NULL
);
124 _DIAGASSERT(cmp
!= NULL
);
126 if (size
< PSIZE
/ 2) { /* Pointers must fit into 2 * size. */
133 * Stupid subtraction for the Cray.
136 if (!(size
% ISIZE
) && !(((char *)base
- (char *)0) % ISIZE
))
139 if ((list2
= malloc(nmemb
* size
+ PSIZE
)) == NULL
)
143 setup(list1
, list2
, nmemb
, size
, cmp
);
144 last
= list2
+ nmemb
* size
;
146 while (*EVAL(list2
) != last
) {
149 for (tp2
= p2
= list2
; p2
!= last
; p1
= EVAL(l2
)) {
152 f2
= l1
= list1
+ (p2
- list2
);
155 l2
= list1
+ (p2
- list2
);
156 while (f1
< l1
&& f2
< l2
) {
157 if ((*cmp
)(f1
, f2
) <= 0) {
166 if (!big
) { /* here i = 0 */
170 while ((b
+= size
) < t
&& cmp(q
, b
) >sense
)
176 EXPONENTIAL
: for (i
= size
; ; i
<<= 1)
177 if ((p
= (b
+ i
)) >= t
) {
178 if ((p
= t
- size
) > b
&&
179 (*cmp
)(q
, p
) <= sense
)
184 } else if ((*cmp
)(q
, p
) <= sense
) {
195 i
= (((t
- b
) / size
) >> 1) * size
;
196 if ((*cmp
)(q
, p
= b
+ i
) <= sense
)
202 FASTCASE
: while (i
> size
)
205 (i
= (unsigned int) i
>> 1)) <= sense
)
214 ICOPY_LIST(f2
, tp2
, b
);
215 ICOPY_ELT(f1
, tp2
, i
);
217 CCOPY_LIST(f2
, tp2
, b
);
218 CCOPY_ELT(f1
, tp2
, i
);
222 ICOPY_LIST(f1
, tp2
, b
);
223 ICOPY_ELT(f2
, tp2
, i
);
225 CCOPY_LIST(f1
, tp2
, b
);
226 CCOPY_ELT(f2
, tp2
, i
);
232 ICOPY_LIST(f2
, tp2
, l2
);
234 CCOPY_LIST(f2
, tp2
, l2
);
235 } else if (f1
< l1
) {
237 ICOPY_LIST(f1
, tp2
, l1
);
239 CCOPY_LIST(f1
, tp2
, l1
);
243 tp2
= list1
; /* swap list1, list2 */
246 last
= list2
+ nmemb
*size
;
249 memmove(list2
, list1
, nmemb
*size
);
256 #define swap(a, b) { \
260 tmp = *a; *a++ = *s; *s++ = tmp; \
264 #define reverse(bot, top) { \
269 tmp = *bot; *bot++ = *s; *s++ = tmp; \
276 * Optional hybrid natural/pairwise first pass. Eats up list1 in runs of
277 * increasing order, list2 in a corresponding linked list. Checks for runs
278 * when THRESHOLD/2 pairs compare with same sense. (Only used when NATURAL
279 * is defined. Otherwise simple pairwise merging is used.)
282 /* XXX: shouldn't this function be static? - lukem 990810 */
284 setup(list1
, list2
, n
, size
, cmp
)
286 int (*cmp
) __P((const void *, const void *));
287 u_char
*list1
, *list2
;
289 int i
, length
, size2
, tmp
, sense
;
290 u_char
*f1
, *f2
, *s
, *l2
, *last
, *p2
;
292 _DIAGASSERT(cmp
!= NULL
);
293 _DIAGASSERT(list1
!= NULL
);
294 _DIAGASSERT(list2
!= NULL
);
298 insertionsort(list1
, n
, size
, cmp
);
299 *EVAL(list2
) = list2
+ n
*size
;
303 * Avoid running pointers out of bounds; limit n to evens
307 insertionsort(list1
+ (n
- i
) * size
, (size_t)i
, size
, cmp
);
308 last
= list1
+ size
* (n
- i
);
309 *EVAL(list2
+ (last
- list1
)) = list2
+ n
* size
;
314 sense
= (cmp(f1
, f1
+ size
) > 0);
315 for (; f1
< last
; sense
= !sense
) {
317 /* Find pairs with same sense. */
318 for (f2
= f1
+ size2
; f2
< last
; f2
+= size2
) {
319 if ((cmp(f2
, f2
+ size
) > 0) != sense
)
323 if (length
< THRESHOLD
) { /* Pairwise merge */
325 p2
= *EVAL(p2
) = f1
+ size2
- list1
+ list2
;
327 swap (f1
, f1
+ size
);
328 } while ((f1
+= size2
) < f2
);
329 } else { /* Natural merge */
331 for (f2
= f1
+ size2
; f2
< l2
; f2
+= size2
) {
332 if ((cmp(f2
-size
, f2
) > 0) != sense
) {
333 p2
= *EVAL(p2
) = f2
- list1
+ list2
;
335 reverse(f1
, f2
-size
);
340 reverse (f1
, f2
-size
);
342 if (f2
< last
|| cmp(f2
- size
, f2
) > 0)
343 p2
= *EVAL(p2
) = f2
- list1
+ list2
;
345 p2
= *EVAL(p2
) = list2
+ n
*size
;
348 #else /* pairwise merge only. */
349 for (f1
= list1
, p2
= list2
; f1
< last
; f1
+= size2
) {
350 p2
= *EVAL(p2
) = p2
+ size2
;
351 if (cmp (f1
, f1
+ size
) > 0)
358 * This is to avoid out-of-bounds addresses in sorting the
362 insertionsort(a
, n
, size
, cmp
)
365 int (*cmp
) __P((const void *, const void *));
367 u_char
*ai
, *s
, *t
, *u
, tmp
;
370 _DIAGASSERT(a
!= NULL
);
371 _DIAGASSERT(cmp
!= NULL
);
373 for (ai
= a
+size
; --n
>= 1; ai
+= size
)
374 for (t
= ai
; t
> a
; t
-= size
) {