% Conference paper: "DP2" range join for genome analysis, HPCS 2019, pages 358--362.
% The citation key is the exporter-generated identifier and is kept as-is so existing \cite commands keep working.
% NOTE(review): address holds the country given by the export (presumably the publisher's); confirm whether a publisher city is wanted instead.
% NOTE(review): the abstract is reproduced verbatim from the export, including its "[6]" citation markers.
@inproceedings{208df95b001e405583aac74ae2cbf49f,
  author    = {Sinha, Aman and Lai, {Bo Cheng}},
  title     = {{DP2}: A Highly Parallel Range Join for Genome Analysis on Distributed Computing Platform},
  booktitle = {2019 International Conference on High Performance Computing and Simulation, {HPCS} 2019},
  pages     = {358--362},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2019},
  month     = jul,
  doi       = {10.1109/HPCS48598.2019.9188222},
  note      = {Conference date: 15--19 July 2019},
  language  = {English},
  keywords  = {distributed heterogeneous systems, Range join, Sequence analysis},
  abstract  = {Rapid growth of the sheer amount of genome data and intense computation become great challenges for downstream genome analytics. Efficient parallel processing and distributed computing are the two effective schemes to address the analysis of big data. Range join is a widely used, effective, yet time-consuming operation that finds the overlap between two different sets of genome features. The current widely adopted BEDTools [6] pipeline adopts single-node binary tree approach, while the distributed GenAp scheme fails to exploit the massive parallel computation on modern throughput processors, such as GPU (Graphic Processing Unit). This paper proposes a novel Distributed Parallel P-ary search (DP2) that applies novel P-ary analysis to enable high parallelism at algorithmic level, and extensively utilize multiple GPUs at system and architecture level. Efficient computation allocation is implemented to leverage the distributed computing on clusters. The proposed framework can be well integrated with current BEDTools [6] pipeline, and achieves an average of 25x speedup for the actual range-join operation when compared with Binary tree approach of GenAp and a 13x end-to-end (total execution time) speedup in comparison to ADAM.},
}