@article{e33331b1ff0c4b788ab82040762b67ef,
title = "Combining tumor genome simulation with crowdsourcing to benchmark somatic single-nucleotide-variant detection",
abstract = "The detection of somatic mutations from cancer genome sequences is key to understanding the genetic basis of disease progression, patient survival and response to therapy. Benchmarking is needed for tool assessment and improvement but is complicated by a lack of gold standards, by extensive resource requirements and by difficulties in sharing personal genomic information. To resolve these issues, we launched the ICGC-TCGA DREAM Somatic Mutation Calling Challenge, a crowdsourced benchmark of somatic mutation detection algorithms. Here we report the BAMSurgeon tool for simulating cancer genomes and the results of 248 analyses of three in silico tumors created with it. Different algorithms exhibit characteristic error profiles, and, intriguingly, false positives show a trinucleotide profile very similar to one found in human tumors. Although the three simulated tumors differ in sequence contamination (deviation from normal cell sequence) and in subclonality, an ensemble of pipelines outperforms the best individual pipeline in all cases. BAMSurgeon is available at https://github.com/adamewing/bamsurgeon/.",
author = "Ewing, {Adam D.} and Houlahan, {Kathleen E.} and Yin Hu and Kyle Ellrott and Cristian Caloian and Yamaguchi, {Takafumi N.} and Bare, {J. Christopher} and Christine P'Ng and Daryl Waggott and Sabelnykova, {Veronica Y.} and Kellen, {Michael R.} and Norman, {Thea C.} and David Haussler and Friend, {Stephen H.} and Gustavo Stolovitzky and Margolin, {Adam A.} and Stuart, {Joshua M.} and Boutros, {Paul C.}",
note = "Funding Information: The authors thank G. Getz, S.P. Shah, R.D. Morin, L.D. Stein and P.T. Spellman for helpful suggestions; N.J. Harding, A.Y.H. Lee and all the members of the Boutros lab for insightful discussions; and K. Dang and all members of Sage for support. This study was conducted with the support of the Ontario Institute for Cancer Research to P.C.B. through funding provided by the government of Ontario. This work was supported by Prostate Cancer Canada and is proudly funded by the Movember Foundation, grant #RS2014-01. This project was supported by Genome Canada through a Large-Scale Applied Project contract to P.C.B., S.P. Shah and R.D. Morin. This work was supported by the Discovery Frontiers: Advancing Big Data Science in Genomics Research program, which is jointly funded by the Natural Sciences and Engineering Research Council (NSERC) of Canada, the Canadian Institutes of Health Research (CIHR), Genome Canada and the Canada Foundation for Innovation (CFI). P.C.B. was supported by a Terry Fox Research Institute New Investigator Award and a CIHR New Investigator Award. K.E.H. was supported by a CIHR Computational Biology Undergraduate Summer Student Health Research Award. A.D.E. was supported by the Mater Foundation. The following US National Institutes of Health grants supported this work: R01-CA180778 (J.M.S., A.A.M.), U24-CA143858 (J.M.S.) and U01-CA176303 (A.A.M.). The authors thank Google Inc. (in particular N. Deflaux) and Annai Systems (in particular D. Maltbie and F. De La Vega) for their ongoing support of the ICGC-TCGA DREAM Somatic Mutation Calling Challenge. Publisher Copyright: {\textcopyright} 2015 Nature America, Inc. All rights reserved.",
year = "2015",
month = jun,
day = "30",
doi = "10.1038/nmeth.3407",
language = "English (US)",
volume = "12",
pages = "623--630",
journal = "Nature Methods",
issn = "1548-7091",
publisher = "Nature Publishing Group",
number = "7",
}