% Conference paper by Hung, Lin, Hua and Hu (2011) in the GDC 2011 proceedings,
% published in the series "Communications in Computer and Information Science".
% - Braces inside title/booktitle protect acronyms and mixed-case names
%   (CloudTSS, TagSNP, GDC, FGIT) from sentence-casing bibliography styles.
% - The abstract is kept verbatim as exported; it is quoted text, not edited here.
% - Conference dates were exported as DD-MM-YYYY and are given in ISO form in
%   the note field (8-10 December 2011).
% NOTE(review): no volume or publisher field was present in the export;
%   confirm both against the DOI record and add them if the style needs them.
@inproceedings{0a2b3d320f344fbb9404cfa49613bb71,
  author    = {Hung, {Che Lun} and Lin, {Yaw Ling} and Hua, {Guan Jie} and Hu, {Yu Chen}},
  title     = {{CloudTSS}: A {TagSNP} selection approach on cloud computing},
  booktitle = {Grid and Distributed Computing -- International Conference, {GDC} 2011, Held as Part of the Future Generation Information Technology Conference, {FGIT} 2011, Proceedings},
  series    = {Communications in Computer and Information Science},
  pages     = {525--534},
  year      = {2011},
  isbn      = {9783642271793},
  doi       = {10.1007/978-3-642-27180-9_64},
  language  = {English},
  keywords  = {Hadoop, Haplotype, MapReduce, SNPs, cloud computing},
  abstract  = {SNPs are fundamental roles for various applications including medical diagnostic, phylogenies and drug design. They provide the highest-resolution genetic fingerprint for identifying disease associations and human features. Genetic variants that are near each other tend to be inherited together; these regions of linked variants are known as haplotypes. Recently, genetics researches revealed that SNPs within certain haplotype blocks induce only a few distinct common haplotypes in the majority of the population. The existence of haplotype block structure has serious implications for association-based methods for the mapping of disease genes. This paper proposes a parallel haplotype block partition and SNPs selection method under a diversity function by using the Hadoop MapReduce framework. The experiment shows that the proposed MapReduce-paralleled combinatorial algorithm performs well on the real-world data obtained in from the HapMap data set; the computation efficiency can be significantly improved proportional to the number of processors being used.},
  note      = {International Conference on Grid and Distributed Computing, GDC 2011, Held as Part of the 3rd International Mega-Conference on Future-Generation Information Technology, FGIT 2011; conference dates: 2011-12-08 through 2011-12-10},
}