diff options
Diffstat (limited to 'src/lib/libc/stdlib/heapsort.c')
-rw-r--r-- | src/lib/libc/stdlib/heapsort.c | 173 |
1 files changed, 173 insertions, 0 deletions
diff --git a/src/lib/libc/stdlib/heapsort.c b/src/lib/libc/stdlib/heapsort.c new file mode 100644 index 0000000000..e6fb61ba2f --- /dev/null +++ b/src/lib/libc/stdlib/heapsort.c | |||
@@ -0,0 +1,173 @@ | |||
1 | /*- | ||
2 | * Copyright (c) 1991, 1993 | ||
3 | * The Regents of the University of California. All rights reserved. | ||
4 | * | ||
5 | * This code is derived from software contributed to Berkeley by | ||
6 | * Ronnie Kon at Mindcraft Inc., Kevin Lew and Elmer Yglesias. | ||
7 | * | ||
8 | * Redistribution and use in source and binary forms, with or without | ||
9 | * modification, are permitted provided that the following conditions | ||
10 | * are met: | ||
11 | * 1. Redistributions of source code must retain the above copyright | ||
12 | * notice, this list of conditions and the following disclaimer. | ||
13 | * 2. Redistributions in binary form must reproduce the above copyright | ||
14 | * notice, this list of conditions and the following disclaimer in the | ||
15 | * documentation and/or other materials provided with the distribution. | ||
16 | * 3. Neither the name of the University nor the names of its contributors | ||
17 | * may be used to endorse or promote products derived from this software | ||
18 | * without specific prior written permission. | ||
19 | * | ||
20 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND | ||
21 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||
22 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||
23 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE | ||
24 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | ||
25 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | ||
26 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | ||
27 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | ||
28 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | ||
29 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | ||
30 | * SUCH DAMAGE. | ||
31 | */ | ||
32 | |||
33 | #include <sys/types.h> | ||
34 | #include <errno.h> | ||
35 | #include <stdlib.h> | ||
36 | |||
37 | /* | ||
38 | * Swap two areas of size number of bytes. Although qsort(3) permits random | ||
39 | * blocks of memory to be sorted, sorting pointers is almost certainly the | ||
40 | * common case (and, were it not, could easily be made so). Regardless, it | ||
41 | * isn't worth optimizing; the SWAP's get sped up by the cache, and pointer | ||
42 | * arithmetic gets lost in the time required for comparison function calls. | ||
43 | */ | ||
44 | #define SWAP(a, b, count, size, tmp) { \ | ||
45 | count = size; \ | ||
46 | do { \ | ||
47 | tmp = *a; \ | ||
48 | *a++ = *b; \ | ||
49 | *b++ = tmp; \ | ||
50 | } while (--count); \ | ||
51 | } | ||
52 | |||
53 | /* Copy one block of size size to another. */ | ||
54 | #define COPY(a, b, count, size, tmp1, tmp2) { \ | ||
55 | count = size; \ | ||
56 | tmp1 = a; \ | ||
57 | tmp2 = b; \ | ||
58 | do { \ | ||
59 | *tmp1++ = *tmp2++; \ | ||
60 | } while (--count); \ | ||
61 | } | ||
62 | |||
63 | /* | ||
64 | * Build the list into a heap, where a heap is defined such that for | ||
65 | * the records K1 ... KN, Kj/2 >= Kj for 1 <= j/2 <= j <= N. | ||
66 | * | ||
67 | * There are two cases. If j == nmemb, select largest of Ki and Kj. If | ||
68 | * j < nmemb, select largest of Ki, Kj and Kj+1. | ||
69 | */ | ||
70 | #define CREATE(initval, nmemb, par_i, child_i, par, child, size, count, tmp) { \ | ||
71 | for (par_i = initval; (child_i = par_i * 2) <= nmemb; \ | ||
72 | par_i = child_i) { \ | ||
73 | child = base + child_i * size; \ | ||
74 | if (child_i < nmemb && compar(child, child + size) < 0) { \ | ||
75 | child += size; \ | ||
76 | ++child_i; \ | ||
77 | } \ | ||
78 | par = base + par_i * size; \ | ||
79 | if (compar(child, par) <= 0) \ | ||
80 | break; \ | ||
81 | SWAP(par, child, count, size, tmp); \ | ||
82 | } \ | ||
83 | } | ||
84 | |||
85 | /* | ||
86 | * Select the top of the heap and 'heapify'. Since by far the most expensive | ||
87 | * action is the call to the compar function, a considerable optimization | ||
88 | * in the average case can be achieved due to the fact that k, the displaced | ||
89 | * element, is usually quite small, so it would be preferable to first | ||
90 | * heapify, always maintaining the invariant that the larger child is copied | ||
91 | * over its parent's record. | ||
92 | * | ||
93 | * Then, starting from the *bottom* of the heap, finding k's correct place, | ||
94 | * again maintaining the invariant. As a result of the invariant no element | ||
95 | * is 'lost' when k is assigned its correct place in the heap. | ||
96 | * | ||
97 | * The time savings from this optimization are on the order of 15-20% for the | ||
98 | * average case. See Knuth, Vol. 3, page 158, problem 18. | ||
99 | * | ||
100 | * XXX Don't break the #define SELECT line, below. Reiser cpp gets upset. | ||
101 | */ | ||
102 | #define SELECT(par_i, child_i, nmemb, par, child, size, k, count, tmp1, tmp2) { \ | ||
103 | for (par_i = 1; (child_i = par_i * 2) <= nmemb; par_i = child_i) { \ | ||
104 | child = base + child_i * size; \ | ||
105 | if (child_i < nmemb && compar(child, child + size) < 0) { \ | ||
106 | child += size; \ | ||
107 | ++child_i; \ | ||
108 | } \ | ||
109 | par = base + par_i * size; \ | ||
110 | COPY(par, child, count, size, tmp1, tmp2); \ | ||
111 | } \ | ||
112 | for (;;) { \ | ||
113 | child_i = par_i; \ | ||
114 | par_i = child_i / 2; \ | ||
115 | child = base + child_i * size; \ | ||
116 | par = base + par_i * size; \ | ||
117 | if (child_i == 1 || compar(k, par) < 0) { \ | ||
118 | COPY(child, k, count, size, tmp1, tmp2); \ | ||
119 | break; \ | ||
120 | } \ | ||
121 | COPY(child, par, count, size, tmp1, tmp2); \ | ||
122 | } \ | ||
123 | } | ||
124 | |||
125 | /* | ||
126 | * Heapsort -- Knuth, Vol. 3, page 145. Runs in O (N lg N), both average | ||
127 | * and worst. While heapsort is faster than the worst case of quicksort, | ||
128 | * the BSD quicksort does median selection so that the chance of finding | ||
129 | * a data set that will trigger the worst case is nonexistent. Heapsort's | ||
130 | * only advantage over quicksort is that it requires little additional memory. | ||
131 | */ | ||
132 | int | ||
133 | heapsort(void *vbase, size_t nmemb, size_t size, | ||
134 | int (*compar)(const void *, const void *)) | ||
135 | { | ||
136 | int cnt, i, j, l; | ||
137 | char tmp, *tmp1, *tmp2; | ||
138 | char *base, *k, *p, *t; | ||
139 | |||
140 | if (nmemb <= 1) | ||
141 | return (0); | ||
142 | |||
143 | if (!size) { | ||
144 | errno = EINVAL; | ||
145 | return (-1); | ||
146 | } | ||
147 | |||
148 | if ((k = malloc(size)) == NULL) | ||
149 | return (-1); | ||
150 | |||
151 | /* | ||
152 | * Items are numbered from 1 to nmemb, so offset from size bytes | ||
153 | * below the starting address. | ||
154 | */ | ||
155 | base = (char *)vbase - size; | ||
156 | |||
157 | for (l = nmemb / 2 + 1; --l;) | ||
158 | CREATE(l, nmemb, i, j, t, p, size, cnt, tmp); | ||
159 | |||
160 | /* | ||
161 | * For each element of the heap, save the largest element into its | ||
162 | * final slot, save the displaced element (k), then recreate the | ||
163 | * heap. | ||
164 | */ | ||
165 | while (nmemb > 1) { | ||
166 | COPY(k, base + nmemb * size, cnt, size, tmp1, tmp2); | ||
167 | COPY(base + nmemb * size, base + size, cnt, size, tmp1, tmp2); | ||
168 | --nmemb; | ||
169 | SELECT(i, j, nmemb, t, p, size, k, cnt, tmp1, tmp2); | ||
170 | } | ||
171 | free(k); | ||
172 | return (0); | ||
173 | } | ||