@article{b979dff38b0d475e9bf8bb1185deb982,
title = "Comprehensive cross-population analysis of high-grade serous ovarian cancer supports no more than three subtypes",
abstract = "Four gene expression subtypes of high-grade serous ovarian cancer (HGSC) have been previously described. In these early studies, a fraction of samples that did not fit well into the four subtype classifications were excluded. Therefore, we sought to systematically determine the concordance of transcriptomic HGSC subtypes across populations without removing any samples. We created a bioinformatics pipeline to independently cluster the five largest mRNA expression datasets using k-means and nonnegative matrix factorization (NMF). We summarized differential expression patterns to compare clusters across studies. While previous studies reported four cause these results contrast with previous reports, we attempted to reproduce analyses performed in those studies. Our results suggest that early results favoring four subtypes may have been driven by the inclusion of serous borderline tumors. In summary, our analysis suggests that either two or three, but not four, gene expression subtypes are most consistent across datasets.",
keywords = "Molecular subtypes, Ovarian cancer, Reproducibility, Unsupervised clustering",
author = "Way, {Gregory P.} and James Rudd and Chen Wang and Habib Hamidi and Fridley, {Brooke L.} and Konecny, {Gottfried E.} and Goode, {Ellen L.} and Greene, {Casey S.} and Doherty, {Jennifer A.}",
note = "Funding Information: We thank Sebastian Armasu and Hsiao-Wang Chen for help with statistical analyses and data processing and Emily Kate Shea for helpful discussions. This work was supported by the National Cancer Institute at the National Institutes of Health (R01 CA168758 to J.A.D., F31 CA186625 to J.R., and R01 CA122443 to E.L.G.); the Mayo Clinic Ovarian Cancer Specialized Program of Research Excellence grant (P50 CA136393 to E.L.G.); the Mayo Clinic Comprehensive Cancer Center-Gene Analysis Shared Resource (P30 CA15083); the Gordon and Betty Moore Foundation's Data-Driven Discovery Initiative (grant number GBMF 4552 to C.S.G.); the American Cancer Society (grant number IRG 8200327 to C.S.G.); and by Norris Cotton Cancer Center Developmental Funds. The authors declare that they have no known conflicts of interest. Aspects of this study were presented at the 2015 American Association for Cancer Research Conference and the 2015 Rocky Mountain Bioinformatics Conference. Publisher Copyright: {\textcopyright} 2016 Way et al.",
year = "2016",
doi = "10.1534/g3.116.033514",
language = "English (US)",
volume = "6",
pages = "4097--4103",
journal = "G3 (Bethesda, Md.)",
issn = "2160-1836",
publisher = "Genetics Society of America",
number = "12",
}