2017-06-15 11:22:49 +08:00
|
|
|
/* -*- c++ -*- ----------------------------------------------------------
|
|
|
|
LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
|
|
|
|
http://lammps.sandia.gov, Sandia National Laboratories
|
|
|
|
Steve Plimpton, sjplimp@sandia.gov
|
|
|
|
|
|
|
|
Copyright (2003) Sandia Corporation. Under the terms of Contract
|
|
|
|
DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
|
|
|
|
certain rights in this software. This software is distributed under
|
|
|
|
the GNU General Public License.
|
|
|
|
|
|
|
|
See the README file in the top-level LAMMPS directory.
|
|
|
|
------------------------------------------------------------------------- */
|
|
|
|
|
|
|
|
#ifndef LMP_MERGESORT
|
|
|
|
#define LMP_MERGESORT
|
|
|
|
|
2018-04-28 05:41:04 +08:00
|
|
|
#include <cstring>
|
2017-06-15 11:22:49 +08:00
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
// custom hybrid upward merge sort implementation with support to pass
|
|
|
|
// an opaque pointer to the comparison function, e.g. for access to
|
|
|
|
// class members. this avoids having to use global variables.
|
|
|
|
// for improved performance, we employ an in-place insertion sort on
|
2017-06-17 06:17:48 +08:00
|
|
|
// chunks of up to 64 elements and switch to merge sort from then on.
|
2017-06-15 11:22:49 +08:00
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
// part 1. insertion sort for pre-sorting of small chunks
|
|
|
|
|
|
|
|
static void insertion_sort(int *index, int num, void *ptr,
|
|
|
|
int (*comp)(int, int, void*))
|
|
|
|
{
|
|
|
|
if (num < 2) return;
|
|
|
|
for (int i=1; i < num; ++i) {
|
|
|
|
int tmp = index[i];
|
|
|
|
for (int j=i-1; j >= 0; --j) {
|
|
|
|
if ((*comp)(index[j],tmp,ptr) > 0) {
|
|
|
|
index[j+1] = index[j];
|
|
|
|
} else {
|
|
|
|
index[j+1] = tmp;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (j == 0) index[0] = tmp;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// part 2. merge two sublists
|
2017-06-15 11:22:49 +08:00
|
|
|
|
|
|
|
static void do_merge(int *idx, int *buf, int llo, int lhi, int rlo, int rhi,
|
|
|
|
void *ptr, int (*comp)(int, int, void *))
|
|
|
|
{
|
|
|
|
int i = llo;
|
|
|
|
int l = llo;
|
|
|
|
int r = rlo;
|
|
|
|
while ((l < lhi) && (r < rhi)) {
|
|
|
|
if ((*comp)(buf[l],buf[r],ptr) < 0)
|
|
|
|
idx[i++] = buf[l++];
|
|
|
|
else idx[i++] = buf[r++];
|
|
|
|
}
|
2017-06-17 06:17:48 +08:00
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
while (l < lhi) idx[i++] = buf[l++];
|
|
|
|
while (r < rhi) idx[i++] = buf[r++];
|
2017-06-15 11:22:49 +08:00
|
|
|
}
|
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
// part 3: loop over sublists doubling in size with each iteration.
|
|
|
|
// pre-sort sublists with insertion sort for better performance.
|
2017-06-15 11:22:49 +08:00
|
|
|
|
|
|
|
static void merge_sort(int *index, int num, void *ptr,
|
|
|
|
int (*comp)(int, int, void *))
|
|
|
|
{
|
|
|
|
if (num < 2) return;
|
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
int chunk,i,j;
|
|
|
|
|
2017-06-17 06:17:48 +08:00
|
|
|
// do insertion sort on chunks of up to 64 elements
|
2017-06-16 20:05:55 +08:00
|
|
|
|
2017-06-17 06:17:48 +08:00
|
|
|
chunk = 64;
|
2017-06-16 20:05:55 +08:00
|
|
|
for (i=0; i < num; i += chunk) {
|
|
|
|
j = (i+chunk > num) ? num-i : chunk;
|
|
|
|
insertion_sort(index+i,j,ptr,comp);
|
|
|
|
}
|
|
|
|
|
|
|
|
// already done?
|
|
|
|
|
|
|
|
if (chunk >= num) return;
|
|
|
|
|
|
|
|
// continue with merge sort on the pre-sorted chunks.
|
|
|
|
// we need an extra buffer for temporary storage and two
|
|
|
|
// pointers to operate on, so we can swap the pointers
|
|
|
|
// rather than copying to the hold buffer in each pass
|
|
|
|
|
|
|
|
int *buf = new int[num];
|
|
|
|
int *dest = index;
|
|
|
|
int *hold = buf;
|
|
|
|
|
|
|
|
while (chunk < num) {
|
|
|
|
int m;
|
2017-06-15 11:22:49 +08:00
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
// swap hold and destination buffer
|
|
|
|
|
|
|
|
int *tmp = dest; dest = hold; hold = tmp;
|
|
|
|
|
2018-10-23 20:57:33 +08:00
|
|
|
// merge from hold array to destination array
|
2017-06-16 20:05:55 +08:00
|
|
|
|
|
|
|
for (i=0; i < num-1; i += 2*chunk) {
|
|
|
|
j = i + 2*chunk;
|
|
|
|
if (j > num) j=num;
|
|
|
|
m = i+chunk;
|
2017-06-15 11:22:49 +08:00
|
|
|
if (m > num) m=num;
|
2017-06-16 20:05:55 +08:00
|
|
|
do_merge(dest,hold,i,m,m,j,ptr,comp);
|
2017-06-15 11:22:49 +08:00
|
|
|
}
|
2018-10-23 20:57:33 +08:00
|
|
|
|
|
|
|
// copy all indices not handled by the chunked merge sort loop
|
|
|
|
|
|
|
|
for ( ; i < num ; i++ ) dest[i] = hold[i];
|
2017-06-16 20:05:55 +08:00
|
|
|
chunk *= 2;
|
2017-06-15 11:22:49 +08:00
|
|
|
}
|
|
|
|
|
2017-06-16 20:05:55 +08:00
|
|
|
// if the final sorted data is in buf, copy back to index
|
|
|
|
|
|
|
|
if (dest == buf) memcpy(index,buf,sizeof(int)*num);
|
|
|
|
|
|
|
|
delete[] buf;
|
2017-06-15 11:22:49 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
#endif
|