mirror of
https://github.com/git/git.git
synced 2026-03-13 18:33:25 +01:00
qsort in Windows 2000 (and possibly other older Windows' C libraries)
is a Quicksort with the usual O(n^2) worst case. Unfortunately, sorting
Git trees seems to get very close to that worst case quite often:
$ /git/gitbad runstatus
# On branch master
qsort, nmemb = 30842
done, 237838087 comparisons.
This patch adds a simplified version of the merge sort that glibc uses
to implement qsort(3). Being a merge sort, it needs a temporary array
equal in size to the array that is to be sorted.
The complexity that was removed is:
* Doing direct stores for word-size and -aligned data.
* Falling back to quicksort if the allocation required to perform the
merge sort would likely push the machine into swap.
Even with these simplifications, this seems to outperform the Windows
qsort(3) implementation, even in Windows XP (where it is "fixed" and
doesn't trigger O(n^2) complexity on trees).
[jes: moved into compat/qsort.c, as per Johannes Sixt's suggestion]
Signed-off-by: Brian Downing <bdowning@lavos.net>
Signed-off-by: Steffen Prohaska <prohaska@zib.de>
Signed-off-by: Johannes Schindelin <johannes.schindelin@gmx.de>
61 lines
1.1 KiB
C
61 lines
1.1 KiB
C
#include "../git-compat-util.h"
|
|
|
|
/*
 * Merge sort, simplified from glibc's implementation.
 *
 * Sorts the n elements of s bytes each starting at b, in place, using
 * cmp to order them.  cmp(x, y) <= 0 means x may precede y; on a tie the
 * element from the lower half is emitted first, so equal elements keep
 * their relative order.
 *
 * t is scratch space for the merge step.  It must not overlap b (the
 * merge uses memcpy) and is reused by every level of the recursion; the
 * caller in this file sizes it at n * s bytes.
 */
static void msort_with_tmp(void *b, size_t n, size_t s,
			   int (*cmp)(const void *, const void *),
			   char *t)
{
	size_t left_count, right_count;
	char *left, *right, *out;

	/* Zero or one element is already sorted. */
	if (n < 2)
		return;

	left_count = n / 2;
	right_count = n - left_count;
	left = b;
	right = left + left_count * s;

	/* Sort each half independently; both calls share the scratch area. */
	msort_with_tmp(left, left_count, s, cmp, t);
	msort_with_tmp(right, right_count, s, cmp, t);

	/* Merge into t until one of the halves runs dry. */
	for (out = t; left_count > 0 && right_count > 0; out += s) {
		if (cmp(left, right) > 0) {
			memcpy(out, right, s);
			right += s;
			--right_count;
		} else {
			memcpy(out, left, s);
			left += s;
			--left_count;
		}
	}

	/* Leftover elements of the lower half go to the end of the merge. */
	if (left_count > 0)
		memcpy(out, left, left_count * s);

	/*
	 * Leftover elements of the upper half already sit at their final
	 * position at the tail of b, so only the first n - right_count
	 * elements have to be copied back from the scratch area.
	 */
	memcpy(b, t, (n - right_count) * s);
}
|
|
|
|
/*
 * Replacement for qsort(3): sort the n elements of s bytes each starting
 * at b, in place, ordering them with cmp.  The work is done by
 * msort_with_tmp(), which needs n * s bytes of scratch space.
 *
 * Scratch areas smaller than 1 KiB live in a fixed on-stack buffer;
 * anything larger is obtained from malloc().  This function cannot
 * report failure to its caller, so it aborts the process when that
 * allocation fails instead of handing a NULL scratch pointer to the sort.
 */
void git_qsort(void *b, size_t n, size_t s,
	       int (*cmp)(const void *, const void *))
{
	const size_t size = n * s;
	/*
	 * Fixed-size rather than a variable-length array: a VLA would have
	 * zero length when n or s is 0, which C does not allow, and VLAs
	 * are not available on every compiler.
	 */
	char buf[1024];

	if (size < sizeof(buf)) {
		/* The temporary array is small, so keep it on the stack. */
		msort_with_tmp(b, n, s, cmp, buf);
	} else {
		/* It's somewhat large, so malloc it. */
		char *tmp = malloc(size);

		if (!tmp)
			abort();
		msort_with_tmp(b, n, s, cmp, tmp);
		free(tmp);
	}
}
|