% Journal article: design of the MNEc2M and MNEc670k equine SNP genotyping arrays.
% Literal tildes are written as \textasciitilde because a bare tilde is a
% non-breaking space in LaTeX; the hash sign in the note field is escaped for
% the same reason. Acronyms in the title are brace-protected against recasing.
@article{b930b9e18c3546fea28a51f2a076abed,
  author    = {Schaefer, {Robert J.} and Mikkel Schubert and Ernest Bailey and Bannasch, {Danika L.} and Eric Barrey and Bar-Gal, {Gila Kahila} and Gottfried Brem and Brooks, {Samantha A.} and Ottmar Distl and Ruedi Fries and Finno, {Carrie J.} and Vinzenz Gerber and Bianca Haase and Vidhya Jagannathan and Ted Kalbfleisch and Tosso Leeb and Gabriella Lindgren and Lopes, {Maria Susana} and N{\'u}ria Mach and {da C{\^a}mara Machado}, Artur and MacLeod, {James N.} and Annette McCoy and Julia Metzger and Cecilia Penedo and Sagi Polani and Stefan Rieder and Imke Tammen and Jens Tetens and Georg Thaller and Andrea Verini-Supplizi and Wade, {Claire M.} and Barbara Wallner and Ludovic Orlando and Mickelson, {James R.} and McCue, {Molly E.}},
  title     = {Developing a 670k genotyping array to tag {\textasciitilde}{2M} {SNPs} across 24 horse breeds},
  journal   = {BMC Genomics},
  volume    = {18},
  number    = {1},
  year      = {2017},
  month     = jul,
  day       = {27},
  publisher = {BioMed Central},
  issn      = {1471-2164},
  doi       = {10.1186/s12864-017-3943-8},
  language  = {English (US)},
  keywords  = {Equine genomics, Linkage disequilibrium, SNP chip, SNP discovery, SNP informativeness, SNP validation, SNP-tagging, Variant recalibration, Whole genome sequence},
  abstract  = {Background: To date, genome-scale analyses in the domestic horse have been limited by suboptimal single nucleotide polymorphism (SNP) density and uneven genomic coverage of the current SNP genotyping arrays. The recent availability of whole genome sequences has created the opportunity to develop a next generation, high-density equine SNP array. Results: Using whole genome sequence from 153 individuals representing 24 distinct breeds collated by the equine genomics community, we cataloged over 23 million de novo discovered genetic variants. Leveraging genotype data from individuals with both whole genome sequence, and genotypes from lower-density, legacy SNP arrays, a subset of {\textasciitilde}5 million high-quality, high-density array candidate SNPs were selected based on breed representation and uniform spacing across the genome. Considering probe design recommendations from a commercial vendor (Affymetrix, now Thermo Fisher Scientific) a set of {\textasciitilde}2 million SNPs were selected for a next-generation high-density SNP chip (MNEc2M). Genotype data were generated using the MNEc2M array from a cohort of 332 horses from 20 breeds and a lower-density array, consisting of {\textasciitilde}670 thousand SNPs (MNEc670k), was designed for genotype imputation. Conclusions: Here, we document the steps taken to design both the MNEc2M and MNEc670k arrays, report genomic and technical properties of these genotyping platforms, and demonstrate the imputation capabilities of these tools for the domestic horse.},
  note      = {Funding Information: Support for the generation of whole genome sequence came from the following sources: USDA NIFA project 2012-67015-19432 and Minnesota Agricultural Experiment Station Multistate project MIN-62-090. The National Animal Genome Project (NRSP8) through the equine genome coordinator: USDA-NRSP8 (2013-2018) horse-technical-committee coordinator funds. The Danish Council for Independent Research, Natural Sciences (Grant 4002-00152B); the Danish National Research Foundation (Grant DNRF94); Initiative d{\textquoteright}Excellence Chaires d{\textquoteright}attractivit{\'e}, Universit{\'e} de Toulouse (OURASI), and; the European Research Council (ERC-CoG-2015-681605). The Bavarian Ministry State Ministry for Food and Agriculture, and Forestry (A/13/39). The Laboratory of Molecular Evolution, The Koret School of Veterinary Medicine, The Hebrew University of Jerusalem, Israel) for contributing pure-bred Arabian whole-genomes on behalf of The Israel Science Foundation (ISF) grant \#1365/10. The Swedish Research Council Formas (221-2013-1661) and the Swedish Research Council VR (621-2012-4666). Funding sources played no role in the design of this study or the collection, analysis, and the interpretation of data and in writing the manuscript. Publisher Copyright: {\textcopyright} 2017 The Author(s).},
}