% Conference paper (ICCS 2023 proceedings). The citation key is kept as exported
% so that existing citations keep resolving.
% NOTE(review): `address` holds a country rather than the publisher's city, and
%   `publisher` differs from the copyright holder named in `note` -- confirm
%   both against the publisher's record before changing them.
% NOTE(review): no `volume` is given for the series -- TODO add the series
%   volume number once verified.
@inproceedings{fe7ef58fe3514e1db447c9a49e8449c1,
  author    = "Gowanlock, Michael and Gallet, Benoit and Donnelly, Brian",
  title     = "Optimization and Comparison of Coordinate- and Metric-Based Indexes on {GPUs} for Distance Similarity Searches",
  editor    = "Miky{\v s}ka, Ji{\v r}{\'\i} and {de Mulatier}, Cl{\'e}lia and Krzhizhanovskaya, Valeria V. and Sloot, Peter M. A. and Paszynski, Maciej and Dongarra, Jack J.",
  booktitle = "Computational Science -- {ICCS} 2023 - 23rd International Conference, Proceedings",
  series    = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
  publisher = "Springer Science and Business Media Deutschland GmbH",
  address   = "Germany",
  pages     = "357--364",
  year      = "2023",
  isbn      = "9783031360206",
  doi       = "10.1007/978-3-031-36021-3_37",
  language  = "English (US)",
  keywords  = "Distance Similarity Search, GPGPU, Metric-based Index",
  note      = "Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 23rd International Conference on Computational Science, ICCS 2023 ; Conference date: 03-07-2023 Through 05-07-2023",
  abstract  = "The distance similarity search (DSS) is a fundamental operation for large-scale data analytics, as it is used to find all points that are within a search distance of a query point. Given that new scientific instruments are generating a tremendous amount of data, it is critical that these searches are highly efficient. Recently, GPU algorithms have been proposed to parallelize the DSS. While most work shows that GPU algorithms largely outperform parallel CPU algorithms, there is no single GPU algorithm that outperforms all other state-of-the-art approaches; therefore, it is not clear which algorithm should be selected based on a dataset/workload. We compare two GPU DSS algorithms: one that indexes directly on the data coordinates, and one that indexes using the distances between data points to a set of reference points. A counterintuitive finding is that the data dimensionality is not a good indicator of which algorithm should be used on a given dataset. We also find that the intrinsic dimensionality (ID) which quantifies structure in the data can be used to parameter tune the algorithms to improve performance over the baselines reported in prior work. Lastly, we find that combining the data dimensionality and ID can be used to select between the best performing GPU algorithm on a dataset.",
}