% Conference paper published in the BIBM 2020 proceedings (IEEE).
% The citation key is the exporter-generated identifier; it is kept unchanged so existing citations still resolve.
% Note: day is not a standard BibTeX field, so classic styles ignore it.
@inproceedings{491c26b6ca9445339eafc251a224bc5b,
  author    = {Cui, Zhe and Liu, Bo and Juan, Liran and Zang, Tianyi and Jiang, Tao and Wang, Yadong},
  title     = {Assessment of Machine Learning Methods for Classification in Single Cell {ATAC-seq}},
  booktitle = {Proceedings - 2020 {IEEE} International Conference on Bioinformatics and Biomedicine, {BIBM} 2020},
  editor    = {Park, Taesung and Cho, Young-Rae and Hu, Xiaohua Tony and Yoo, Illhoi and Woo, Hyun Goo and Wang, Jianxin and Facelli, Julio and Nam, Seungyoon and Kang, Mingon},
  pages     = {412--416},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2020},
  month     = dec,
  day       = {16},
  doi       = {10.1109/BIBM49941.2020.9313138},
  language  = {English},
  keywords  = {classification, evaluation, machine learning, scATAC-seq},
  abstract  = {Single-cell assay for transposase accessible chromatin using sequencing (scATAC-seq) is rapidly advancing our understanding of the cellular composition of complex tissues and organisms. The similarity of data structure and feature between scRNA-seq and scATAC-seq makes it feasible to identify the cell types in scATAC-seq through traditional supervised machine learning methods. Here, we evaluated 6 popular machine learning methods for classification in scATAC-seq. The performance of the methods is evaluated using 4 public single cell ATAC-seq datasets of different tissues, sizes and technologies. We evaluated these methods using intradatasets experiments of 5-folds cross validation based on accuracy, recall and percentage of correctly predicted cells. We found that these methods may perform well in some types of cells in a single dataset, but the overall results are not as well as in scRNA-seq analysis. For testing the classification ability of machine learning methods across datasets, we applied inter-dataset experiments to test the performance of machine learning methods in realistic scenarios. SVM and NMC are overall the top 2 best-performing methods across all experiments. We recommend researchers to apply SVM and NMC as the underlying classifier when developing an automatic classification method in scATAC-seq.},
  note      = {Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 IEEE International Conference on Bioinformatics and Biomedicine, BIBM 2020; Conference date: 16-12-2020 Through 19-12-2020},
}