LCOV - code coverage report
Current view: top level - third_party/heimdal/lib/roken - mergesort_r.c (source / functions) Hit Total Coverage
Test: coverage report for v4-17-test 1498b464 Lines: 84 138 60.9 %
Date: 2024-06-13 04:01:37 Functions: 3 3 100.0 %

          Line data    Source code
       1             : /*-
       2             :  * Copyright (c) 1992, 1993
       3             :  *      The Regents of the University of California.  All rights reserved.
       4             :  *
       5             :  * This code is derived from software contributed to Berkeley by
       6             :  * Peter McIlroy.
       7             :  *
       8             :  * Redistribution and use in source and binary forms, with or without
       9             :  * modification, are permitted provided that the following conditions
      10             :  * are met:
      11             :  * 1. Redistributions of source code must retain the above copyright
      12             :  *    notice, this list of conditions and the following disclaimer.
      13             :  * 2. Redistributions in binary form must reproduce the above copyright
      14             :  *    notice, this list of conditions and the following disclaimer in the
      15             :  *    documentation and/or other materials provided with the distribution.
      16             :  * 3. Neither the name of the University nor the names of its contributors
      17             :  *    may be used to endorse or promote products derived from this software
      18             :  *    without specific prior written permission.
      19             :  *
      20             :  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
      21             :  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
      22             :  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
      23             :  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
      24             :  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
      25             :  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
      26             :  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
      27             :  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
      28             :  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
      29             :  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
      30             :  * SUCH DAMAGE.
      31             :  */
      32             : 
      33             : #include <config.h>
      34             : #include "roken.h"
      35             : 
      36             : /*
      37             :  * Hybrid exponential search/linear search merge sort with hybrid
      38             :  * natural/pairwise first pass.  Requires about .3% more comparisons
      39             :  * for random data than LSMS with pairwise first pass alone.
      40             :  * It works for objects as small as two bytes.
      41             :  */
      42             : 
      43             : #define NATURAL
      44             : #define THRESHOLD 16    /* Best choice for natural merge cut-off. */
      45             : 
      46             : /* #define NATURAL to get hybrid natural merge.
      47             :  * (The default is pairwise merging.)
      48             :  */
      49             : 
      50             : #include <sys/types.h>
      51             : 
      52             : #include <errno.h>
      53             : #include <stdlib.h>
      54             : #include <string.h>
      55             : 
      56             : typedef int (*cmp_t)(const void *, const void *, void *);
      57             : 
      58             : static void setup(u_char *, u_char *, size_t, size_t, cmp_t, void *);
      59             : static void insertionsort(u_char *, size_t, size_t, cmp_t, void *);
      60             : 
      61             : #define ISIZE sizeof(int)
      62             : #define PSIZE sizeof(u_char *)
      63             : #define ICOPY_LIST(src, dst, last)                              \
      64             :         do                                                      \
      65             :         *(int*)dst = *(int*)src, src += ISIZE, dst += ISIZE;    \
      66             :         while(src < last)
      67             : #define ICOPY_ELT(src, dst, i)                                  \
      68             :         do                                                      \
      69             :         *(int*) dst = *(int*) src, src += ISIZE, dst += ISIZE;  \
      70             :         while (i -= ISIZE)
      71             : 
      72             : #define CCOPY_LIST(src, dst, last)              \
      73             :         do                                      \
      74             :                 *dst++ = *src++;                \
      75             :         while (src < last)
      76             : #define CCOPY_ELT(src, dst, i)                  \
      77             :         do                                      \
      78             :                 *dst++ = *src++;                \
      79             :         while (i -= 1)
      80             : 
      81             : /*
      82             :  * Find the next possible pointer head.  (Trickery for forcing an array
      83             :  * to do double duty as a linked list when objects do not align with word
      84             :  * boundaries.
      85             :  */
      86             : /* Assumption: PSIZE is a power of 2. */
      87             : #define EVAL(p) (u_char **)                                             \
      88             :         ((((uintptr_t)p + PSIZE - 1) & ~(PSIZE - 1)))
      89             : 
      90             : /*
      91             :  * Arguments are as for qsort_r, except thunk is moved to the last
      92             :  * parameter for glibc compatibility. See:
      93             :  * https://bugs.freebsd.org/bugzilla/show_bug.cgi?id=214248
      94             :  */
      95             : int
      96         154 : mergesort_r(void *base, size_t nmemb, size_t size, cmp_t cmp, void *thunk)
      97             : {
      98             :         size_t i;
      99             :         int sense;
     100             :         int big, iflag;
     101             :         u_char *f1, *f2, *t, *b, *tp2, *q, *l1, *l2;
     102             :         u_char *list2, *list1, *p2, *p, *last, **p1;
     103             : 
     104         154 :         if (size < PSIZE / 2) {              /* Pointers must fit into 2 * size. */
     105           0 :                 errno = EINVAL;
     106           0 :                 return (-1);
     107             :         }
     108             : 
     109         154 :         if (nmemb == 0)
     110           0 :                 return (0);
     111             : 
     112             :         /*
     113             :          * XXX
     114             :          * Stupid subtraction for the Cray.
     115             :          */
     116         154 :         iflag = 0;
     117         154 :         if (!(size % ISIZE) && !(((uintptr_t)base) % ISIZE))
     118         154 :                 iflag = 1;
     119             : 
     120         154 :         if ((list2 = malloc(nmemb * size + PSIZE)) == NULL)
     121           0 :                 return (-1);
     122             : 
     123         154 :         list1 = base;
     124         154 :         setup(list1, list2, nmemb, size, cmp, thunk);
     125         154 :         last = list2 + nmemb * size;
     126         154 :         i = big = 0;
     127         336 :         while (*EVAL(list2) != last) {
     128          28 :             l2 = list1;
     129          28 :             p1 = EVAL(list1);
     130          70 :             for (tp2 = p2 = list2; p2 != last; p1 = EVAL(l2)) {
     131          42 :                 p2 = *EVAL(p2);
     132          42 :                 f1 = l2;
     133          42 :                 f2 = l1 = list1 + (p2 - list2);
     134          42 :                 if (p2 != last)
     135          28 :                         p2 = *EVAL(p2);
     136          42 :                 l2 = list1 + (p2 - list2);
     137         140 :                 while (f1 < l1 && f2 < l2) {
     138          56 :                         if (cmp(f1, f2, thunk) <= 0) {
     139          42 :                                 q = f2;
     140          42 :                                 b = f1, t = l1;
     141          42 :                                 sense = -1;
     142             :                         } else {
     143          14 :                                 q = f1;
     144          14 :                                 b = f2, t = l2;
     145          14 :                                 sense = 0;
     146             :                         }
     147          56 :                         if (!big) {     /* here i = 0 */
     148         140 :                                 while ((b += size) < t && cmp(q, b, thunk) >sense)
     149          28 :                                         if (++i == 6) {
     150           0 :                                                 big = 1;
     151           0 :                                                 goto EXPONENTIAL;
     152             :                                         }
     153             :                         } else {
     154           0 : EXPONENTIAL:                    for (i = size; ; i <<= 1)
     155           0 :                                         if ((p = (b + i)) >= t) {
     156           0 :                                                 if ((p = t - size) > b &&
     157           0 :                                                     cmp(q, p, thunk) <= sense)
     158           0 :                                                         t = p;
     159             :                                                 else
     160           0 :                                                         b = p;
     161           0 :                                                 break;
     162           0 :                                         } else if (cmp(q, p, thunk) <= sense) {
     163           0 :                                                 t = p;
     164           0 :                                                 if (i == size)
     165           0 :                                                         big = 0;
     166           0 :                                                 goto FASTCASE;
     167             :                                         } else
     168           0 :                                                 b = p;
     169           0 :                                 while (t > b+size) {
     170           0 :                                         i = (((t - b) / size) >> 1) * size;
     171           0 :                                         if (cmp(q, p = b + i, thunk) <= sense)
     172           0 :                                                 t = p;
     173             :                                         else
     174           0 :                                                 b = p;
     175             :                                 }
     176           0 :                                 goto COPY;
     177           0 : FASTCASE:                       while (i > size)
     178           0 :                                         if (cmp(q,
     179           0 :                                                 p = b + (i >>= 1), thunk) <= sense)
     180           0 :                                                 t = p;
     181             :                                         else
     182           0 :                                                 b = p;
     183           0 : COPY:                           b = t;
     184             :                         }
     185          56 :                         i = size;
     186          56 :                         if (q == f1) {
     187          14 :                                 if (iflag) {
     188          28 :                                         ICOPY_LIST(f2, tp2, b);
     189          28 :                                         ICOPY_ELT(f1, tp2, i);
     190             :                                 } else {
     191           0 :                                         CCOPY_LIST(f2, tp2, b);
     192           0 :                                         CCOPY_ELT(f1, tp2, i);
     193             :                                 }
     194             :                         } else {
     195          42 :                                 if (iflag) {
     196         140 :                                         ICOPY_LIST(f1, tp2, b);
     197          84 :                                         ICOPY_ELT(f2, tp2, i);
     198             :                                 } else {
     199           0 :                                         CCOPY_LIST(f1, tp2, b);
     200           0 :                                         CCOPY_ELT(f2, tp2, i);
     201             :                                 }
     202             :                         }
     203             :                 }
     204          42 :                 if (f2 < l2) {
     205          28 :                         if (iflag)
     206          84 :                                 ICOPY_LIST(f2, tp2, l2);
     207             :                         else
     208           0 :                                 CCOPY_LIST(f2, tp2, l2);
     209          14 :                 } else if (f1 < l1) {
     210          14 :                         if (iflag)
     211         140 :                                 ICOPY_LIST(f1, tp2, l1);
     212             :                         else
     213           0 :                                 CCOPY_LIST(f1, tp2, l1);
     214             :                 }
     215          42 :                 *p1 = l2;
     216             :             }
     217          28 :             tp2 = list1;        /* swap list1, list2 */
     218          28 :             list1 = list2;
     219          28 :             list2 = tp2;
     220          28 :             last = list2 + nmemb*size;
     221             :         }
     222         154 :         if (base == list2) {
     223           0 :                 memmove(list2, list1, nmemb*size);
     224           0 :                 list2 = list1;
     225             :         }
     226         154 :         free(list2);
     227         154 :         return (0);
     228             : }
     229             : 
     230             : #define swap(a, b) {                                    \
     231             :                 s = b;                                  \
     232             :                 i = size;                               \
     233             :                 do {                                    \
     234             :                         tmp = *a; *a++ = *s; *s++ = tmp; \
     235             :                 } while (--i);                          \
     236             :                 a -= size;                              \
     237             :         }
     238             : #define reverse(bot, top) {                             \
     239             :         s = top;                                        \
     240             :         do {                                            \
     241             :                 i = size;                               \
     242             :                 do {                                    \
     243             :                         tmp = *bot; *bot++ = *s; *s++ = tmp; \
     244             :                 } while (--i);                          \
     245             :                 s -= size2;                             \
     246             :         } while(bot < s);                            \
     247             : }
     248             : 
     249             : /*
     250             :  * Optional hybrid natural/pairwise first pass.  Eats up list1 in runs of
     251             :  * increasing order, list2 in a corresponding linked list.  Checks for runs
     252             :  * when THRESHOLD/2 pairs compare with same sense.  (Only used when NATURAL
     253             :  * is defined.  Otherwise simple pairwise merging is used.)
     254             :  */
     255             : void
     256         154 : setup(u_char *list1, u_char *list2, size_t n, size_t size, cmp_t cmp, void *thunk)
     257             : {
     258             :         int i, length, size2, tmp, sense;
     259             :         u_char *f1, *f2, *s, *l2, *last, *p2;
     260             : 
     261         154 :         size2 = size*2;
     262         154 :         if (n <= 5) {
     263         140 :                 insertionsort(list1, n, size, cmp, thunk);
     264         140 :                 *EVAL(list2) = (u_char*) list2 + n*size;
     265         140 :                 return;
     266             :         }
     267             :         /*
     268             :          * Avoid running pointers out of bounds; limit n to evens
     269             :          * for simplicity.
     270             :          */
     271          14 :         i = 4 + (n & 1);
     272          14 :         insertionsort(list1 + (n - i) * size, i, size, cmp, thunk);
     273          14 :         last = list1 + size * (n - i);
     274          14 :         *EVAL(list2 + (last - list1)) = list2 + n * size;
     275             : 
     276             : #ifdef NATURAL
     277          14 :         p2 = list2;
     278          14 :         f1 = list1;
     279          14 :         sense = (cmp(f1, f1 + size, thunk) > 0);
     280          28 :         for (; f1 < last; sense = !sense) {
     281          14 :                 length = 2;
     282             :                                         /* Find pairs with same sense. */
     283          28 :                 for (f2 = f1 + size2; f2 < last; f2 += size2) {
     284          14 :                         if ((cmp(f2, f2+ size, thunk) > 0) != sense)
     285           0 :                                 break;
     286          14 :                         length += 2;
     287             :                 }
     288          14 :                 if (length < THRESHOLD) {            /* Pairwise merge */
     289             :                         do {
     290          28 :                                 p2 = *EVAL(p2) = f1 + size2 - list1 + list2;
     291          28 :                                 if (sense > 0)
     292           0 :                                         swap (f1, f1 + size);
     293          28 :                         } while ((f1 += size2) < f2);
     294             :                 } else {                                /* Natural merge */
     295           0 :                         l2 = f2;
     296           0 :                         for (f2 = f1 + size2; f2 < l2; f2 += size2) {
     297           0 :                                 if ((cmp(f2-size, f2, thunk) > 0) != sense) {
     298           0 :                                         p2 = *EVAL(p2) = f2 - list1 + list2;
     299           0 :                                         if (sense > 0)
     300           0 :                                                 reverse(f1, f2-size);
     301           0 :                                         f1 = f2;
     302             :                                 }
     303             :                         }
     304           0 :                         if (sense > 0)
     305           0 :                                 reverse (f1, f2-size);
     306           0 :                         f1 = f2;
     307           0 :                         if (f2 < last || cmp(f2 - size, f2, thunk) > 0)
     308           0 :                                 p2 = *EVAL(p2) = f2 - list1 + list2;
     309             :                         else
     310           0 :                                 p2 = *EVAL(p2) = list2 + n*size;
     311             :                 }
     312             :         }
     313             : #else           /* pairwise merge only. */
     314             :         for (f1 = list1, p2 = list2; f1 < last; f1 += size2) {
     315             :                 p2 = *EVAL(p2) = p2 + size2;
     316             :                 if (cmp (f1, f1 + size) > 0)
     317             :                         swap(f1, f1 + size);
     318             :         }
     319             : #endif /* NATURAL */
     320             : }
     321             : 
     322             : /*
     323             :  * This is to avoid out-of-bounds addresses in sorting the
     324             :  * last 4 elements.
     325             :  */
     326             : static void
     327         154 : insertionsort(u_char *a, size_t n, size_t size, cmp_t cmp, void *thunk)
     328             : {
     329             :         u_char *ai, *s, *t, *u, tmp;
     330             :         int i;
     331             : 
     332         364 :         for (ai = a+size; --n >= 1; ai += size)
     333         448 :                 for (t = ai; t > a; t -= size) {
     334         364 :                         u = t - size;
     335         364 :                         if (cmp(u, t, thunk) <= 0)
     336         126 :                                 break;
     337         238 :                         swap(u, t);
     338             :                 }
     339         154 : }

Generated by: LCOV version 1.13