@inproceedings{0df7491a3d82465e91a9b6dd6ff0976a,
title = "Deep learning approach to biogeographical ancestry inference",
abstract = "Biogeographical ancestry (BGA) inference is based on the understanding of genetic diversity distribution among population groups. BGA inference is used to detect and measure the population structure that presents the natural assignment in genetic terms, identify genetic patterns found in individuals' genotypes, and estimate an individual's BGAs. In the context of forensic, BGA inference at an individual level gives the possibilities to achieve more complete identification of missing person or suspect. Current machine learning approach to BGA inference based on Bayesian theory and principle component analysis cannot operate on the data sequence directly and require predefined features extracted from the data sequence based on prior knowledge. In this paper, we conduct a survey of the state of the art of BGA inference and propose a new approach based on deep learning to BGA inference without prior feature extraction to find hidden genetic structure and provide more accurate predictions. Our experiments conducted on the dataset for Human Genome Diversity Project (HGDP) show better results for the proposed approach.",
keywords = "Biogeographical ancestry inference, machine learning",
author = "Yue Qu and Dat Tran and Wanli Ma",
year = "2019",
doi = "10.1016/j.procs.2019.09.210",
language = "English",
volume = "159",
series = "Procedia Computer Science",
publisher = "Elsevier",
pages = "552--561",
editor = "Rudas, {I. J} and C Janos and C. Toro and J. Botzheim and Howlett, {R. J.} and Jain, {L. C.}",
booktitle = "23rd KES International Conference on Knowledge-Based and Intelligent Information & Engineering Systems KES2019",
address = "Netherlands",
note = "23rd International Conference on Knowledge-Based and Intelligent Information & Engineering Systems, KES 2019 ; Conference date: 04-09-2019 Through 06-09-2019",
}