% Conference paper in an edited LNCS proceedings volume. The repository export
% typed this as inbook and copied the series name into booktitle; both are
% corrected below. NOTE(review): booktitle and volume were filled in from the
% publisher record for this DOI -- confirm against the Springer landing page.
@inproceedings{5e80b71fc3ee453b9000f9b8cc7314bc,
  author    = {Jeon, Minsoo and Kim, Dongseung},
  title     = {Distribution-Insensitive Parallel External Sorting on {PC} Clusters},
  editor    = {Veidenbaum, Alex and Joe, Kazuki and Amano, Hideharu and Aiso, Hideo},
  booktitle = {High Performance Computing: 5th International Symposium, {ISHPC} 2003},
  series    = {Lecture Notes in Computer Science},
  volume    = {2858},
  pages     = {202--213},
  publisher = {Springer Verlag},
  year      = {2003},
  doi       = {10.1007/978-3-540-39707-6_15},
  isbn      = {3540203591},
  language  = {English},
  abstract  = {There have been many parallel external sorting algorithms reported such as NOW-Sort, SPsort, and hill sort, etc. They are for sorting large-scale data stored in the disk, but they differ in the speed, throughput, and cost-effectiveness. Mostly they deal with data that are uniformly distributed in their value range. Few research results have been yet reported for parallel external sort for data with arbitrary distribution. In this paper, we present two distribution-insensitive parallel external sorting algorithms that use sampling technique and histogram counts to achieve even distribution of data among processors, which eventually contribute to achieve superb performance. Experimental results on a cluster of Linux workstations show up to 63\% reduction in the execution time compared to previous NOW-sort.},
}