@article{6c537892c7f34aa28d59da74c702d4f6,
title = "Synthetic DNA barcodes identify singlets in scRNA-seq datasets and evaluate doublet algorithms",
abstract = "Single-cell RNA sequencing (scRNA-seq) datasets contain true single cells, or singlets, in addition to cells that coalesce during the protocol, or doublets. Identifying singlets with high fidelity in scRNA-seq is necessary to avoid false negative and false positive discoveries. Although several methodologies have been proposed, they are typically tested on highly heterogeneous datasets and lack a priori knowledge of true singlets. Here, we leveraged datasets with synthetically introduced DNA barcodes for a hitherto unexplored application: to extract ground-truth singlets. We demonstrated the feasibility of our framework, “singletCode,” to evaluate existing doublet detection methods across a range of contexts. We also leveraged our ground-truth singlets to train a proof-of-concept machine learning classifier, which outperformed other doublet detection algorithms. Our integrative framework can identify ground-truth singlets and enable robust doublet detection in non-barcoded datasets.",
keywords = "barcoding, benchmarking, doublet detection, lineage tracing, machine learning, scRNA-seq, single-cell genomics, singletCode, singlets",
author = "Ziyang Zhang and Melzer, {Madeline E.} and Arun, {Keerthana M.} and Hanxiao Sun and Eriksson, {Carl Johan} and Itai Fabian and Sagi Shaashua and Karun Kiani and Yaara Oren and Yogesh Goyal",
note = "Publisher Copyright: {\textcopyright} 2024 The Author(s)",
year = "2024",
month = jul,
day = "10",
doi = "10.1016/j.xgen.2024.100592",
language = "אנגלית",
volume = "4",
journal = "Cell Genomics",
issn = "2666-979X",
publisher = "Cell Press",
number = "7",
}