nih-gov/www.ncbi.nlm.nih.gov/books/n/helpsnpfaq/FTP_Finding_Specific/index.html
2025-03-17 02:05:34 +00:00

491 lines
No EOL
102 KiB
HTML
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<!-- AppResources meta begin -->
<meta name="paf-app-resources" content="" />
<script type="text/javascript">var ncbi_startTime = new Date();</script>
<!-- AppResources meta end -->
<!-- TemplateResources meta begin -->
<meta name="paf_template" content="" />
<!-- TemplateResources meta end -->
<!-- Logger begin -->
<meta name="ncbi_db" content="books" /><meta name="ncbi_pdid" content="book-part" /><meta name="ncbi_acc" content="NBK573445" /><meta name="ncbi_domain" content="helpsnpfaq" /><meta name="ncbi_report" content="record" /><meta name="ncbi_type" content="fulltext" /><meta name="ncbi_objectid" content="" /><meta name="ncbi_pcid" content="/NBK573445/" /><meta name="ncbi_pagename" content="Finding Specific Data in dbSNPs FTP Files - SNP FAQ Archive - NCBI Bookshelf" /><meta name="ncbi_bookparttype" content="chapter" /><meta name="ncbi_app" content="bookshelf" />
<!-- Logger end -->
<title>Finding Specific Data in dbSNPs FTP Files - SNP FAQ Archive - NCBI Bookshelf</title>
<!-- AppResources external_resources begin -->
<link rel="stylesheet" href="/core/jig/1.15.2/css/jig.min.css" /><script type="text/javascript" src="/core/jig/1.15.2/js/jig.min.js"></script>
<!-- AppResources external_resources end -->
<!-- Page meta begin -->
<meta name="robots" content="NOINDEX,NOFOLLOW,NOARCHIVE,NOIMAGEINDEX" /><meta name="citation_inbook_title" content="SNP FAQ Archive [Internet]" /><meta name="citation_title" content="Finding Specific Data in dbSNPs FTP Files" /><meta name="citation_publisher" content="National Center for Biotechnology Information (US)" /><meta name="citation_date" content="2014/02/18" /><meta name="citation_fulltext_html_url" content="https://www.ncbi.nlm.nih.gov/books/NBK573445/" /><link rel="schema.DC" href="http://purl.org/DC/elements/1.0/" /><meta name="DC.Title" content="Finding Specific Data in dbSNPs FTP Files" /><meta name="DC.Type" content="Text" /><meta name="DC.Publisher" content="National Center for Biotechnology Information (US)" /><meta name="DC.Date" content="2014/02/18" /><meta name="DC.Identifier" content="https://www.ncbi.nlm.nih.gov/books/NBK573445/" /><meta name="og:title" content="Finding Specific Data in dbSNPs FTP Files" /><meta name="og:type" content="book" /><meta name="og:url" content="https://www.ncbi.nlm.nih.gov/books/NBK573445/" /><meta name="og:site_name" content="NCBI Bookshelf" /><meta name="og:image" content="https://www.ncbi.nlm.nih.gov/corehtml/pmc/pmcgifs/bookshelf/thumbs/th-helpsnpfaq-lrg.png" /><meta name="twitter:card" content="summary" /><meta name="twitter:site" content="@ncbibooks" /><meta name="warning" content="This publication is provided for historical reference only and the information may be out of date." 
/><meta name="bk-non-canon-loc" content="/books/n/helpsnpfaq/FTP_Finding_Specific/" /><link rel="canonical" href="https://www.ncbi.nlm.nih.gov/books/NBK573445/" /><link rel="stylesheet" href="/corehtml/pmc/css/figpopup.css" type="text/css" media="screen" /><link rel="stylesheet" href="/corehtml/pmc/css/bookshelf/2.26/css/books.min.css" type="text/css" /><link rel="stylesheet" href="/corehtml/pmc/css/bookshelf/2.26/css/books_print.min.css" type="text/css" media="print" /><style type="text/css">.main-content {background:transparent repeat-y top left;background-image:url(/corehtml/pmc/css/bookshelf/2.26/img/archive.png);background-size: auto, contain; padding:0 0 0 3em }</style><style type="text/css">p a.figpopup{display:inline !important} .bk_tt {font-family: monospace} .first-line-outdent .bk_ref {display: inline} .body-content h2, .body-content .h2 {border-bottom: 1px solid #97B0C8} .body-content h2.inline {border-bottom: none} a.page-toc-label , .jig-ncbismoothscroll a {text-decoration:none;border:0 !important} .temp-labeled-list .graphic {display:inline-block !important} .temp-labeled-list img{width:100%}</style><script type="text/javascript" src="/corehtml/pmc/js/jquery.hoverIntent.min.js"> </script><script type="text/javascript" src="/corehtml/pmc/js/common.min.js?_=3.18"> </script><script type="text/javascript" src="/corehtml/pmc/js/large-obj-scrollbars.min.js"> </script><script type="text/javascript">window.name="mainwindow";</script><script type="text/javascript" src="/corehtml/pmc/js/bookshelf/2.26/book-toc.min.js"> </script><script type="text/javascript" src="/corehtml/pmc/js/bookshelf/2.26/books.min.js"> </script><meta name="book-collection" content="helpcollect" />
<!-- Page meta end -->
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8E54F77C8BDCA10000000000CB00A9.m_13" />
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4216699/css/3852956/3985586/3808861/4121862/3974050/3917732/251717/4216701/14534/45193/4113719/3849091/3984811/3751656/4033350/3840896/3577051/3852958/4008682/4207974/4206132/4062871/12930/3964959/3854974/36029/4128070/9685/3549676/3609192/3609193/3609213/3395586.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4216699/css/3411343/3882866.css" media="print" /></head>
<body class="book-part">
<div class="grid">
<div class="col twelve_col nomargin shadow">
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
<div class="sysmessages">
<noscript>
<p class="nojs">
<strong>Warning:</strong>
The NCBI web site requires JavaScript to function.
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
</p>
</noscript>
</div>
<!--/.sysmessage-->
<div class="wrap">
<div class="page">
<div class="top">
<div id="universal_header">
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
<div class="usa-banner-guidance-gov usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
<span class="fa fa-user" aria-hidden="true">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
<g style="fill: #fff">
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
</g>
</svg>
</span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
<span class="fa fa-times">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
</svg>
</span>
<span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br />
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
</div>
<div class="header">
<div class="res_logo"><h1 class="res_name"><a href="/books/" title="Bookshelf home">Bookshelf</a></h1><h2 class="res_tagline"></h2></div>
<div class="search"><form method="get" action="/books/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="books" selected="selected" data-ac_dict="bookshelf-search">Books</option><option value="biosample">BioSample</option><option value="medgen">MedGen</option><option value="dbvar" class="last">dbVar</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books" data-ac_dict="bookshelf-search">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option 
value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label for="term" class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search Books. Use up and down arrows to choose an item from the autocomplete." value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="dictionary:'bookshelf-search',disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'no'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div></form><ul class="searchlinks inline_list"><li>
<a href="/books/browse/">Browse Titles</a>
</li><li>
<a href="/books/advanced/">Advanced</a>
</li><li class="help">
<a href="/books/NBK3833/">Help</a>
</li><li class="disclaimer">
<a target="_blank" data-ga-category="literature_resources" data-ga-action="link_click" data-ga-label="disclaimer_link" href="https://www.ncbi.nlm.nih.gov/books/about/disclaimer/">Disclaimer</a>
</li></ul></div>
</div>
<!--<component id="Page" label="headcontent"/>-->
</div>
<div class="content">
<!-- site messages -->
<!-- Custom content 1 -->
<div class="col1">
</div>
<div class="container">
<div id="maincontent" class="content eight_col col">
<!-- Custom content in the left column above book nav -->
<div class="col2">
</div>
<!-- Book content -->
<!-- Custom content between navigation and content -->
<div class="col3">
</div>
<div class="document">
<div class="pre-content"><div><div class="bk_prnt"><p class="small">NCBI Bookshelf. A service of the National Library of Medicine, National Institutes of Health.</p><p>SNP FAQ Archive [Internet]. Bethesda (MD): National Center for Biotechnology Information (US); 2005-. </p></div><div class="messagearea bk_noprnt" style="margin-bottom:1.3846em "><ul class="messages"><li class="warn icon"><span class="icon">This publication is provided for historical reference only and the information may be out of date.</span></li></ul></div><div class="bk_prnt"><p style="color:red;"><strong>This publication is provided for historical reference only and the information may be out of date.</strong></p></div><div class="iconblock clearfix whole_rhythm no_top_margin bk_noprnt"><a class="img_link icnblk_img" title="Table of Contents Page" href="/books/n/helpsnpfaq/"><img class="source-thumb" src="/corehtml/pmc/pmcgifs/bookshelf/thumbs/th-helpsnpfaq-lrg.png" alt="Cover of SNP FAQ Archive" height="100px" width="80px" /></a><div class="icnblk_cntnt eight_col"><h2>SNP FAQ Archive [Internet].</h2><a data-jig="ncbitoggler" href="#__NBK573445_dtls__">Show details</a><div style="display:none" class="ui-widget" id="__NBK573445_dtls__"><div>Bethesda (MD): <a href="https://www.ncbi.nlm.nih.gov/" ref="pagearea=page-banner&amp;targetsite=external&amp;targetcat=link&amp;targettype=publisher">National Center for Biotechnology Information (US)</a>; 2005-.</div></div><div class="half_rhythm"><ul class="inline_list"><li style="margin-right:1em"><a class="bk_cntns" href="/books/n/helpsnpfaq/">Contents</a></li></ul></div></div><div class="icnblk_cntnt two_col"><div class="pagination bk_noprnt"><a class="active page_link prev" href="/books/n/helpsnpfaq/FTP_Navigating_dbSNP/" title="Previous page in this title">&lt; Prev</a><a class="active page_link next" href="/books/n/helpsnpfaq/FTP_SNP_Report_Files/" title="Next page in this title">Next &gt;</a></div></div></div></div></div>
<div class="main-content lit-style" itemscope="itemscope" itemtype="http://schema.org/CreativeWork"><div class="meta-content fm-sec"><h1 id="_NBK573445_"><span class="title" itemprop="name">Finding Specific Data in dbSNP&#x02019;s FTP Files</span></h1><p class="small">Created: <span itemprop="datePublished">July 7, 2005</span>; Last Update: <span itemprop="dateModified">February 18, 2014</span>.</p><p><em>Estimated reading time: 17 minutes</em></p></div><div class="jig-ncbiinpagenav body-content whole_rhythm" data-jigconfig="allHeadingLevels: ['h2'],smoothScroll: false" itemprop="text"><ul class="simple-list"><li><h4>Finding Functional Class Data</h4></li><li><p><a href="#FTP_Finding_Specific.i_noticed_that_the">I noticed that the coding non-synonymous function code has been subdivided. Can you list and define the subdivisions?</a></p></li><li><p><a href="#FTP_Finding_Specific.where_can_i_find_a">Where can I find a flat file where the non-synonymous SNPs are mapped to their respective positions in the corresponding proteins along with the SNP and protein IDs?</a></p></li><li><p><a href="#FTP_Finding_Specific.i_noticed_that_b127">I noticed that b127 SNPs are no longer associated with function class codes 1,2,5, and 7. 
Does dbSNP no longer use these function class codes?</a></p></li><li><p><a href="#FTP_Finding_Specific.where_do_i_find_inf">Where do I find information on SNP functional classes?</a></p></li><li><p><a href="#FTP_Finding_Specific.does_dbsnp_have_ftp">Does dbSNP have ftp tables that contains splice site SNP location data?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_search_for">How do I search for information regarding the number of SNPs found in coding regions within a gene using the gi, NM, or XM ID numbers?</a></p></li><li><p><a href="#FTP_Finding_Specific.is_it_possible_to_d">Is it possible to download a report that includes SNP function x gene model relationships?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Population Diversity Data</h4></li><li><p><a href="#FTP_Finding_Specific.which_ftp_file_cont">Which FTP file contains the population diversity data tables?</a></p></li><ul class="simple-list"><li><h4>Finding Hardy Weinberg Probabilities</h4></li><li><p><a href="#FTP_Finding_Specific.where_can_i_downloa">Where can I download population diversity data such as Hardy Weinberg Probabilities via FTP for all of the SNPs described in dbSNP?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Average Heterozygosity, Allele Frequency and Genotype Frequency</h4></li><li><p><a href="#FTP_Finding_Specific.is_there_a_table_th">Is there a table that shows the most common CYP2C9 alleles in Caucasians?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_download_t">How do I download the data located in the variation summary section of the refSNP report for all human SNPs? 
Would I get it on your ftp site?</a></p></li></ul><ul class="simple-list"><li><h4>Finding All Alleles for a Given SNP</h4></li><li><p><a href="#FTP_Finding_Specific.where_is_the_bcp_fi">Where is the .bcp file that contains the alleles for any given SNP?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Reference Alleles</h4></li><li><p><a href="#FTP_Finding_Specific.how_do_i_get_the_re">How do I get the reference allele (ie the allele on the reference contig) for each refSNP in human build 128?</a></p></li></ul><ul class="simple-list"><li><h4>Finding a Report of Allele Frequencies across Major Populations</h4></li><li><p><a href="#FTP_Finding_Specific.i_want_to_download">I want to download flat files that list all SNPs for which allele frequencies exist across the major human populations (European, East Asian, and African). Where can I find such data?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Genotypes</h4></li><li><p><a href="#FTP_Finding_Specific.i_need_to_identify">I need to identify SNPs that are different between C57BL/J and A/J mice from a list of 50,000 SNPs. Downloading the data by chromosome is very time consuming. 
Is there a better way to do this?</a></p></li></ul></ul><ul class="simple-list"><li><h4>Finding IDs</h4></li><li><p><a href="#FTP_Finding_Specific.which_snp_tablescol">Which SNP tables/columns do I have to parse to find the local_snp_ids for all SNPs I submitted?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_download_a">How do I download a complete list of refSNP (rs) IDs for the most recent SNP release?</a></p></li><li><p><a href="#FTP_Finding_Specific.where_can_i_find_a_1">Where can I find a file that contains the relationship between Ensembl IDs and RefSNP IDs?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_fetch_data">How do I fetch data for a given refSNP ID (rsID) in XML format using a simple URL-request?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Mapping Data</h4></li><li><p><a href="#FTP_Finding_Specific.where_can_i_find_a_2">Where can I find a flat file where the non-synonymous SNPs are mapped to their respective positions in the corresponding proteins along with the SNP and protein IDs?</a></p></li><li><p><a href="#FTP_Finding_Specific.where_in_the_ftp_si">Where in the FTP site do I find a table with coordinates of refSNPs (or subSNPs) in the genome (build 36)?</a></p></li><li><p><a href="#FTP_Finding_Specific.i_m_working_with_a">I&#x02019;m working with a local copy of dbSNP and need to know where I can find information that relates the orientation of a gene with the orientation of a SNP on that gene.</a></p></li><li><p><a href="#FTP_Finding_Specific.is_there_an_easy_wa">Is there an easy way to get SNP/human assembly mapping information from dbSNP, or does getting this information require downloading the entire SQL database?</a></p></li><li><p><a href="#FTP_Finding_Specific.can_i_determine_if">Can I determine if a SNP is uniquely mapped if I find a map location for the SNP in b126_SNPContigLoc_36_1, and if the following two mapping conditions are met: rf_ngbr - lf_ngbr - 1 = 1 and rf_ngbr - lf_ngbr = rc_ngbr - lc_ngbr 
?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_determine">How do I determine all trueSNPs that have unique mapping on one assembly?</a></p></li><li><p><a href="#FTP_Finding_Specific.i_m_looking_for_a_s">I&#x02019;m looking for a SNP that seems to have no genome mapping positions. I thought it would be in the 126 XML ds_chUn or ds_chNotOn files, but can&#x02019;t find it. Where is it?</a></p></li><ul class="simple-list"><li><h4>Finding Orientation Data</h4></li><li><p><a href="#FTP_Finding_Specific.i_have_a_huge_list">I have a huge list of human rs numbers, how do I get a list of their alleles in forward orientation?</a></p></li></ul></ul><ul class="simple-list"><li><h4>Finding Sequence Data in CSV Format</h4></li><li><p><a href="#FTP_Finding_Specific.i_am_submitting_seq">I am submitting sequence to Illumina for Golden Gate assay oligo design, which requires a Microsoft Excel file in csv format, where each FASTA sequence is in a single cell of the file. Can I retrieve data from dbSNP in this format?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Microarray Data</h4></li><li><p><a href="#FTP_Finding_Specific.do_you_have_any_aff">Do you have any AFFY or ILLUMINA array data available?</a></p></li><li><p><a href="#FTP_Finding_Specific.where_can_i_downloa_1">Where can I download individual 1M Illumina SNP data from dbSNP?</a></p></li><li><p><a href="#FTP_Finding_Specific.we_are_using_illumi">We are using Illumina HumanHap550 V1, but Illumina provides chromosome positions based on Build 35. 
Can you give me the chromosome positions based on Build 36?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Merged RefSNP (rs) Data</h4></li><li><p><a href="#FTP_Finding_Specific.i_want_to_find_all">I want to find all the refSNPs that got merged in build 127, but when I downloaded RsMergeArch.bcp.gz, I couldn&#x02019;t find a single entry for Build 127.</a></p></li><li><p><a href="#FTP_Finding_Specific.do_you_have_a_table">Do you have a table of merged SNPs somewhere within dbSNP?</a></p></li><li><p><a href="#FTP_Finding_Specific.how_do_i_query_dbsn">How do I query dbSNP so that it will return a flat or xml file containing the new RefSNP (rs) ID number into which a previously valid rs recently merged?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Deleted (no longer used) refSNP Numbers</h4></li><li><p><a href="#FTP_Finding_Specific.the__rscurrent_fiel">The &#x0201c;rsCurrent&#x0201d; field in RsMergeArch contains 129,000 rs numbers not in the ASN.1 flat files or in a dbSNP web search. 
Is there a list of expired rs numbers?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Method Data</h4></li><li><p><a href="#FTP_Finding_Specific.where_can_i_find_a_3">Where can I find a SNP file that contains method information?</a></p></li></ul><ul class="simple-list"><li><h4>Finding SNP data for NCBI Genome Builds</h4></li><li><p><a href="#FTP_Finding_Specific.how_can_i_get_the_s">How can I get the SNP data for NCBI&#x02019;s genome build 34?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Submitter Data</h4></li><li><p><a href="#FTP_Finding_Specific.although_i_can_sear">Although I can search dbSNP for CSHL-HAPMAP, the output is too large and lists SNPs submitted by CSHL-HAPMAP and others, while I need just those submitted originally by HAPMAP.</a></p></li><li><p><a href="#FTP_Finding_Specific.where_do_i_find_a_l">Where do I find a list of submitters and the number of submitted SNP (ss) and refSNP (rs) clusters that each has submitted?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Submitter Referenced Genbank Accessions</h4></li><li><p><a href="#FTP_Finding_Specific.are_snp_submitter_r">Are SNP submitter referenced Genbank accessions available for down load?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Validation Data</h4></li><li><p><a href="#FTP_Finding_Specific.where_can_i_find_a_4">Where can I find a variation status field as defined in HGVbase for the mouse genome in dbSNP?</a></p></li></ul><ul class="simple-list"><li><h4>Finding Variation Class Data</h4></li><li><p><a href="#FTP_Finding_Specific.if_i_want_to_downlo">If I want to download all the indels from dbSNP, do I download the SNP table? If so, where is it?</a></p></li></ul><ul class="simple-list"><li><h4>Finding SNPs for a Specific Organism</h4></li><li><p><a href="#FTP_Finding_Specific.how_do_i_download_a_1">How do I download all the SNPs for Bos taurus? 
I need the SNP positions on each chromosome and the bovine reference build (Btau3.1 or Btau4).</a></p></li></ul><div id="FTP_Finding_Specific.Finding_Functional"><h2 id="_FTP_Finding_Specific_Finding_Functional_">Finding Functional Class Data</h2><div><h4 id="FTP_Finding_Specific.i_noticed_that_the">I noticed that the coding non-synonymous function code has been subdivided. Can you list and define the subdivisions?</h4><blockquote><p><b>Function Code 41:</b> &#x0201c;Nonsense&#x0201d; (coding nonsynonymous)</p><p>changes to the Stop codon</p><p><b>Function Code 42:</b> &#x0201c;Missense&#x0201d; (coding nonsynonymous)</p><p>alters codon to make an altered amino acid in protein product</p><p><b>Function Code 44:</b> &#x0201c;Frameshift&#x0201d; (coding nonsynonymous)</p><p>indel SNP causing frameshift</p><p>You can find up-to-date function codes and their definitions in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/shared_data/SnpFunctionCode.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SnpFunctionCode.bcp.gz</a> table located in the /shared_data directory of the dbSNP FTP site. (<b>10/27/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_can_i_find_a">Where can I find a flat file where the non-synonymous SNPs are mapped to their respective positions in the corresponding proteins along with the SNP and protein IDs?</h4><blockquote><p>Please see the <a href="/books/n/helpsnpfaq/Schm_Locating_Schema/#Schm_Locating_Schema.Functional_synonymo">Functional (synonymous, non-synonymous, etc.)Data Table</a> section of this archive, and the <a href="/books/n/helpsnpfaq/Schm_Field_Definitio/#Schm_Field_Definitio.SNPContigLocusId_ta">SNPContigLocusId Table</a> section of this archive to get information about retrieving non-synonymous SNPs. 
You can download the SNPContigLocusId table from dbSNP&#x02019;s <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FTP site</a> in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/organism_data/human_9606" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data directory</a> (this link takes you to the directory for human) for your organism of interest. (<b>07/25/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.i_noticed_that_b127">I noticed that b127 SNPs are no longer associated with function class codes 1,2,5, and 7. Does dbSNP no longer use these function class codes?</h4><blockquote><p>As of build 127, function codes 1, 5 and 7 have been modified into two digit codes that will more precisely indicate the location of a SNP. The two digit codes have function codes 1, 5 or 7 as the first digit, each of these numbers keeping its original meaning, and 3 or 5 as the second digit, indicating whether the SNP is 3&#x02019; or 5&#x02019; to the region of interest. 
So the new function codes are as follows:</p><p><b>Function code 13</b>: &#x0201c;nearGene-3&#x0201d;</p><p>Where:<br />1=locus region <br />3= SNP is 3&#x02019; to and 0.5kb away from gene</p><p><b>Function code 15</b>: &#x0201c;nearGene-5&#x0201d;</p><p>Where: <br />1=locus region <br />5= SNP is 5&#x02019; to and 2kb away from gene</p><p><b>Function code 53</b>: &#x0201c;UTR-3&#x0201d;</p><p>Where:<br />5= UTR (untranslated region)<br />3= SNP located in the 3&#x02019; untranslated region</p><p><b>Function code 55</b>: &#x0201c;UTR-5&#x0201d;</p><p>Where:<br />5= UTR (untranslated region)<br />5(as the second digit)= SNP located in the 5&#x02019; untranslated region</p><p><b>Function code 73</b>: &#x0201c;splice-3&#x0201d;</p><p>Where:<br />7=splice site<br />3=3&#x02019; acceptor dinucleotide</p><p><b>Function code 75</b>: &#x0201c;splice-5&#x0201d;</p><p>Where:<br />7=splice site<br />5=5&#x02019; donor dinucleotide</p><p>Function code 2, however, was retired permanently as of b127, as it identified a SNP as being in the coding region of a gene but indicated that other details about its location were unknown. Since mapping and annotation have improved dramatically since function code 2 was defined, it is no longer used. (<b>4/30/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_do_i_find_inf">Where do I find information on SNP functional classes?</h4><blockquote><p>Information on SNP functional classes is located in the SNPFunctionCode table. 
You can find a description of this table by doing the following:</p><dl class="temp-labeled-list"><dt>1.</dt><dd><p class="no_top_margin">Click on <a href="/SNP/snp_db_list_table.cgi" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Database dictionary</a> in the documentation section of the left blue sidebar on the <a href="/SNP/index.html" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">dbSNP home page</a>.</p></dd><dt>2.</dt><dd><p class="no_top_margin">Type SNPFunctionCode in the text box located in the light blue &#x0201c;Search by&#x0201d; box located at the top of the page, and then click on the &#x0201c;Search&#x0201d; button located below the text box.</p></dd><dt>3.</dt><dd><p class="no_top_margin">Click on the SNPFunctionCode link on the response page to get a full <a href="/SNP/snp_db_table_description.cgi?t=SnpFunctionCode" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">description of the SNPFunctionCode table</a>. (<b>1/18/06</b>)</p></dd></dl></blockquote></div><div><h4 id="FTP_Finding_Specific.does_dbsnp_have_ftp">Does dbSNP have ftp tables that contains splice site SNP location data?</h4><blockquote><p>Look in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/shared_data" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">shared_data</a> directory for your organism on the dbSNP <a href="ftp://ftp.ncbi.nlm.nih.gov/snp" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ftp site</a> and download SnpFunctionCode.bcp.gz, which defines the codes used for function class. 
It indicates that a splice-site associated with the SNP is either code 73 (splice-3: 3 prime acceptor dinucleotide) or code 75 (splice-5: 5 prime donor dinucleotide).</p><p>Then go to the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/organism_data/human_9606" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data directory</a> (this link takes you to the directory for human) for your organism of interest, and download SNPContigLocusId.bcp.gz, which contains the snp_id and the functional class code for each SNP. You can find a <a href="/projects/SNP/snp_db_table_description.cgi?t=SNPContigLocusId" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">description</a> of the columns in the SNPContigLocusId table online. Please note that the &#x0201c;locus_id&#x0201d; column of this table stores the NCBI gene ID. <b>(11/15/07)</b></p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_search_for">How do I search for information regarding the number of SNPs found in coding regions within a gene using the gi, NM, or XM ID numbers?</h4><blockquote><p>Go to the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data</a> directory located in your organism&#x02019;s database and click on SNPContigLocusId.bcp.gz. This is an ASCII image of the database table containing all of our snp-to-gene information as gathered from the NCBI assembly processing. See below for column headings.</p><p>You probably only want to keep rows where fxn_class is 3, 4, or 8.</p><p>Here are the columns. 
The example is the first NON_SYNON encountered from the top:</p><pre>Columns Example COMMENT<br /><br />snp_id 47 snp_id<br />contig_acc <a href="/nuccore/568815311" class="bk_tag" ref="pagearea=body&amp;targetsite=entrez&amp;targetcat=link&amp;targettype=nuccore">NT_007819</a> contig accession<br />contig_ver 14 contig version<br />asn_from 10876794 contig position<br />asn_to 10876794 contig position<br />locus_id 23249 locus link identifier<br />locus_symbol KIAA0960 gene name<br />mrna_acc <a href="/nuccore/89024692" class="bk_tag" ref="pagearea=body&amp;targetsite=entrez&amp;targetcat=link&amp;targettype=nuccore">XM_371877</a> mrna accession<br />mrna_ver 2 mrna version<br />protein_acc <a href="/protein/89024693/?report=GenPept" class="bk_tag" ref="pagearea=body&amp;targetsite=entrez&amp;targetcat=link&amp;targettype=genpept">XP_371877</a> protein accession<br />protein_ver 2 protein version<br />fxn_class 4 2,3,4,8 are coding, 6=intron, 5=utr<br />reading_frame 1<br />allele G allele as found on mrna_acc<br />residue D residue as found on protein_acc<br />aa_position 514 position of residue in protein_acc<br />build_id 34_3 Genome build; assembly context<br /> is a property of contig</pre></blockquote></div><div><h4 id="FTP_Finding_Specific.is_it_possible_to_d">Is it possible to download a report that includes SNP function x gene model relationships?</h4><blockquote><p>The dbSNP XML format provides extensive information on SNP function x gene model relationships as a potential sub-property of each contig location defined for the variation. Protein structure data is provided in the complex element NSE-rs_structure-data when available.</p><p>If you are interested in a specific set of SNPs or genes (i.e. 
a small set of data), you can get the data via dbSNP's batch query service by selecting one of the XML reports in the &#x0201c;submission format&#x0201d; toggle menu at the bottom of the Batch query page.</p><p>If you are interested in the complete set of SNP functional data, it is available on the dbSNP <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FTP site</a>. The data are dumped by organism &#x00026; chromosome when a reference genome is available to organize the data.</p><p>OMIM functional mapping for human variations are currently not part of the XML file, but you can download the entire table of SNPxOMIM data from the ftp site as a <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/OmimVarLocusIdSNP.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">relational table</a>. The relational table has the following structure:</p><pre>CREATE TABLE [SNP2Omim] <br />([omim_id] [int] NOT NULL ,<br />[var_id] [char] (4) COLLATE Latin1_General_BIN NOT NULL ,<br />[locus_id] [int] NOT NULL ,<br />[snp_id] [int] NOT NULL ,<br />[aa1] [char] (1) COLLATE Latin1_General_BIN NOT NULL ,<br />[aa_pos] [int] NOT NULL ,<br />[aa2] [char] (1) COLLATE Latin1_General_BIN NOT NULL) ON [PRIMARY]<br />GO</pre><p>
<b>(7/22/05)</b>
</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Population"><h2 id="_FTP_Finding_Specific_Finding_Population_">Finding Population Diversity Data</h2><div><h4 id="FTP_Finding_Specific.which_ftp_file_cont">Which FTP file contains the population diversity data tables?</h4><blockquote><p>The ftp file that contains the genotype and allele frequency data for human is:</p><p><a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype/</a> (<b>4/21/06</b>)</p></blockquote></div><div id="FTP_Finding_Specific.Finding_Hardy_Weinb"><h3>Finding Hardy-Weinberg Probabilities</h3><div><h4 id="FTP_Finding_Specific.where_can_i_downloa">Where can I download population diversity data such as Hardy-Weinberg Probabilities via FTP for all of the SNPs described in dbSNP?</h4><blockquote><p>The information you are looking for is located in the &#x0201c;genotype&#x0201d; file for the particular organism you are interested in. For example, if you are interested in population diversity data for human, go to the dbSNP FTP site, select the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organisms</a> directory, then select the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">human</a> directory, and then select the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">genotype</a> file. The format of these files is described <a href="/SNP/geno/genoex_doc.html" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">online</a>. 
(<b>10/5/06</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Average_Het"><h3>Finding Average Heterozygosity, Allele Frequency and Genotype Frequency</h3><div><h4 id="FTP_Finding_Specific.is_there_a_table_th">Is there a table that shows the most common CYP2C9 alleles in Caucasians?</h4><blockquote><p>dbSNP doesn't have data for common alleles sorted by race. We only provide the allele frequency of populations defined by the submitter, some of which may be Caucasians. <a href="/SNP/GeneGt.cgi?rpttype=html&#x00026;lkup=human_9606/genotype_by_gene/by_GeneID/0_25000/1000_2000/1559_chr10&#x00026;tax_id=9606" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">The dbSNP Genotype and Allele Frequency Report</a> for CYP2C9 may help you find the common alleles you are looking for. (<b>09/07/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_download_t">How do I download the data located in the variation summary section of the refSNP report for all human SNPs? Would I get it on your ftp site?</h4><blockquote><p>You can get the data from the following three database table dump files located in the dbSNP <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ftp site</a>:</p><p>SNP.bcp.gz (the relevant fields are snp_id, which is the rs#, and avg_heterozygosity)</p><p>SNPAlleleFreq.bcp.gz</p><p>SNPGtyFreq.bcp.gz</p><p>Also located in the ftp directory are the Allele.bcp.gz and the UniGty.bcp.gz tables, where you can find the meaning of each allele_id and/or unigty_id. The column descriptions for all the tables can be found in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/b124/mssql/schema/DataDictionary_b118.html" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">dbSNP Data Dictionary</a>. 
<b>(4/1/05)</b></p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_All_Alleles"><h3>Finding All Alleles for a Given SNP</h3><div><h4 id="FTP_Finding_Specific.where_is_the_bcp_fi">Where is the .bcp file that contains the alleles for any given SNP?</h4><blockquote><p>We don't have a table that keeps all alleles for a given refSNP. That&#x02019;s why you can't find a single .bcp file that has this information. You can get all the alleles for a given refSNP through the relationship between the following tables. Please see the ER diagram for table relationships:</p><p>SNPSubSNPLink, SubSNP, ObsVariation, VariAllele</p><p>When the submitted SNP is on a reverse strand with the refSNP (SNPSubSNPLink.substrand_reversed_flag=1), you need to also reverse the alleles of the submitted SNP. Another complication is that our current data model also allows submitters to submit new alleles (not reported in assay reports) with frequency or genotype on an existing SNP.</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Reference_A"><h3>Finding Reference Alleles</h3><div><h4 id="FTP_Finding_Specific.how_do_i_get_the_re">How do I get the reference allele (ie the allele on the reference contig) for each refSNP in human build 128?</h4><blockquote><p>The alleles at the SNP contig position are in table SNPContigLoc.</p><p>Specifically for b128, it is in file b128_SNPContigLoc_36_2 which is located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data subdirectory</a> for human. 
The <a href="/SNP/snp_db_table_description.cgi?t=SNPContigLoc" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">column descriptions for SNPContigLoc</a> are located in dbSNP&#x02019;s data dictionary.(<b>02/26/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_a_Report_of"><h3>Finding a Report of Allele Frequencies across Major Populations</h3><div><h4 id="FTP_Finding_Specific.i_want_to_download">I want to download flat files that list all SNPs for which allele frequencies exist across the major human populations (European, East Asian, and African). Where can I find such data?</h4><blockquote><p>We currently do not have a flat file report of allele frequencies across major populations for all human SNPs. If you can work with XML files, you can find FTP files of genotype data (including genotype and allele frequency data) in the dbSNP FTP site. They are organized by chromosomes:</p><p>
<a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype/</a>
</p><p>
<a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype_by_gene/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/genotype_by_gene/</a>
</p><p>If you are working with a set of SNPs, you could use <a href="/SNP/SNPeutils.htm" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">eutils</a> to fetch the allele frequency information.</p><p>In the meantime, we will look at making a new FTP file format for reporting SNP frequencies. (<b>7/24/07</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Genotypes"><h3>Finding Genotypes</h3><div><h4 id="FTP_Finding_Specific.i_need_to_identify">I need to identify SNPs that are different between C57BL/J and A/J mice from a list of 50,000 SNPs. Downloading the data by chromosome is very time consuming. Is there a better way to do this?</h4><blockquote><p>All the mouse genotype data submitted to dbSNP are available on the FTP site. Go to the mouse organism database, and select &#x0201c;<a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/mouse_10090/genotype/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">genotype</a>&#x0201d; from the list of available files. 
You can then download all of the data and do your own analysis. (<b>6/19/06</b>)</p></blockquote></div></div></div><div id="FTP_Finding_Specific.Finding_IDs"><h2 id="_FTP_Finding_Specific_Finding_IDs_">Finding IDs</h2><div><h4 id="FTP_Finding_Specific.which_snp_tablescol">Which SNP tables/columns do I have to parse to find the local_snp_ids for all SNPs I submitted?</h4><blockquote><p>To find the local IDs for specific submitted SNP (ss) numbers, all you need are the SubSNP.subsnp_id and SubSNP.loc_snp_id columns from <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/SubSNP.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SubSNP.bcp.gz</a> located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data</a> subdirectory for the organism of choice (the links above go to human). The SubSNP table column definitions are in <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_schema/dbSNP_sup_table.sql.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">dbSNP_sup_table.sql.gz</a>, which is located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_schema/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_schema</a> subdirectory of a particular organism (again, the links go to human). 
(<b>05/28/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_download_a">How do I download a complete list of refSNP (rs) IDs for the most recent SNP release?</h4><blockquote><p>You can get a list of valid rs numbers for each organism for which dbSNP has data from the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism directory</a> of the dbSNP FTP site.</p><p>All report types in the dbSNP FTP site include the rs ID numbers. The most compact report you can download is &#x0201c;Chromosome Reports&#x0201d; (chr_rpts). (<b>11/23/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_can_i_find_a_1">Where can I find a file that contains the relationship between Ensembl IDs and RefSNP IDs?</h4><blockquote><p>We don&#x02019;t have a file that shows the relationship between Ensembl IDs and RefSNP IDs. On our refSNP page, however, we do have a link to Ensembl that you can use to examine the Ensembl entry for a particular SNP. Go to the refSNP page for a particular refSNP, say <a href="/SNP/snp_ref.cgi?rs=3180392" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">rs3180392</a>. Look at the top of the page to the right of the &#x0201c;Allele&#x0201d; section. Here you will find some small, blue text: &#x0201c;Links&#x0201d;. Click on &#x0201c;Links&#x0201d; to open a drop-down menu. Click on &#x0201c;Ensembl&#x0201d; to go to the <a href="http://www.ensembl.org/Homo_sapiens/snpview?snp=rs3180392&#x00026;source=dbSNP" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Ensembl page</a> for this SNP. 
(ud:<b>03/19/08</b>).</p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_fetch_data">How do I fetch data for a given refSNP ID (rsID) in XML format using a simple URL-request?</h4><blockquote><p>Please see the <a href="/books/n/coursework/eutils/">online short course</a> for using eutils (<b>9/15/06</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Mapping_Dat"><h2 id="_FTP_Finding_Specific_Finding_Mapping_Dat_">Finding Mapping Data</h2><div><h4 id="FTP_Finding_Specific.where_can_i_find_a_2">Where can I find a flat file where the non-synonymous SNPs are mapped to their respective positions in the corresponding proteins along with the SNP and protein IDs?</h4><blockquote><p>Please see the <a href="/books/n/helpsnpfaq/Schm_Locating_Schema/#Schm_Locating_Schema.Functional_synonymo">Functional (synonymous, non-synonymous, etc.)Data Table</a> section of this archive, and the <a href="/books/n/helpsnpfaq/Schm_Field_Definitio/#Schm_Field_Definitio.SNPContigLocusId_ta">SNPContigLocusId Table</a> section of this archive to get information about retrieving non-synonymous SNPs. You can download the SNPContigLocusId table from dbSNP&#x02019;s <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FTP site</a> in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/organism_data/human_9606" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data directory</a>(this link takes you to the directory for human) for your organism of interest. (<b>07/25/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_in_the_ftp_si">Where in the FTP site do I find a table with coordinates of refSNPs (or subSNPs) in the genome (build 36)?</h4><blockquote><p>You can find the latest chromosome position of a refSNP in the phys_pos_from column of the b129_SNPContigLoc_36_3 table. 
(<b>07/10/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.i_m_working_with_a">I&#x02019;m working with a local copy of dbSNP and need to know where I can find information that relates the orientation of a gene with the orientation of a SNP on that gene.</h4><blockquote><p><a href="/SNP/snp_db_list_table.cgi?fld=Description&#x00026;cond=contains&#x00026;srch=SNPContigloc&#x00026;cond=contains&#x00026;cond=&#x00026;type=&#x00026;fld=Description&#x00026;fld=&#x00026;srch=SNPcontigloc&#x00026;srch=&#x00026;go=Search+%28case+insensitive%29&#x00026;.cgifields=cond&#x00026;.cgifields=fld" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">SNPContigLoc</a> stores rs to contig orientation and <a href="/SNP/snp_db_table_description.cgi?t=ContigExon" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">ContigExon</a> stores mRNA to contig orientation.</p><p>Please see the &#x0201c;<a href="/books/n/helpsnpfaq/Bld_dbSNP_Mapping/#Bld_dbSNP_Mapping.Forward_vs_Reverse_str">Forward vs. Reverse strand Orientation</a>&#x0201d; section in the Mapping Process section of this archive. (<b>05/08/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.is_there_an_easy_wa">Is there an easy way to get SNP/human assembly mapping information from dbSNP, or does getting it require downloading the entire sql database?</h4><blockquote><p><a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/chr_rpts/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">Chromosome Reports</a> (this link goes to the chr_rpts directory for human) give the contig position and chromosome coordinates, plus the gene identifier if the SNP is in the locus of a gene. If you use chromosome reports, be aware that chromosome 7 has two complete assemblies, and the only way to differentiate them in the chromosome report is to look for "7" versus "7b" in the ctg ID field. 
For example, <a href="/snp/?term=7" class="bk_tag" ref="pagearea=body&amp;targetsite=entrez&amp;targetcat=term&amp;targettype=snp">rs7</a> hits both the reference assembly on Hs7_8090_34 at chromosome position 91391586 and the alternate assembly Hs7b_79660_34 at chromosome position 90737098. The thing that will drive you nuts if you're not careful is that the chromosome coordinates in the two assemblies are fairly close but not identical.</p></blockquote></div><div><h4 id="FTP_Finding_Specific.can_i_determine_if">Can I determine if a SNP is uniquely mapped if I find a map location for the SNP in b126_SNPContigLoc_36_1, and if the following two mapping conditions are met: rf_ngbr - lf_ngbr - 1 = 1 and rf_ngbr - lf_ngbr = rc_ngbr - lc_ngbr ?</h4><blockquote><p>What you are doing is generally correct, but SNPContigLoc has mapping data for all assemblies (e.g. the human data includes both the NCBI and Celera assemblies), so you&#x02019;ll need to determine which assembly you have by joining with the ContigInfo table. Also, rf_ngbr - lf_ngbr - 1 = 1 may include other types of variations, as a result of the method we use to code the variation in rs FASTA: we always use "N" for any length of indel, mixed SNP, MNP, etc. Anything that is not using the IUPAC code letters, we make an "N". As a result, many variations may fit the two conditions you listed.</p><p>There is an <a href="/SNP/snp_db_table_description.cgi?t=SNPContigLoc" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">online description</a> of the SNPContigLoc table that includes an example sql showing how to determine all trueSNPs that have unique mapping on one assembly. 
(<b>8/21/06</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_determine">How do I determine all trueSNPs that have unique mapping on one assembly?</h4><blockquote><p>The <a href="/SNP/snp_db_table_description.cgi?t=SNPContigLoc" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">online description</a> of the SNPContigLoc table includes an example sql that shows how to determine all trueSNPs that have unique mapping on one assembly.(<b>8/21/06</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.i_m_looking_for_a_s">I&#x02019;m looking for a SNP that seems to have no genome mapping positions. I thought it would be in the 126 XML ds_chUn or ds_chNotOn files, but can&#x02019;t find it. Where is it?</h4><blockquote><p>The SNP you are looking for is in the ds_ch11.xml file of the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/XML" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">human XML</a> directory. 
This SNP maps to the Celera assembly only, so it will not appear in your Entrez search results since Entrez indexes only SNPs that map to the NCBI reference assembly.(<b>8/30/06</b>)</p></blockquote></div><div id="FTP_Finding_Specific.Finding_Orientation"><h3>Finding Orientation Data</h3><div><h4 id="FTP_Finding_Specific.i_have_a_huge_list">I have a huge list of human rs numbers, how do I get a list of their alleles in forward orientation?</h4><blockquote><p>This information is available in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/b129_SNPContigLoc_36_3.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SNPContigLoc</a> and <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/b129_ContigInfo_36_3.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">ContigInfo</a> tables.</p><p>SNPContigLoc contains the rs allele on the contig, while ContigInfo contains information about the contig position and orientation on the genome(chromosome), so from these two tables you should be able to derive the genomic allele orientation.</p><p>You will find descriptions for the <a href="/projects/SNP/snp_db_table_description.cgi?t=SNPContigLoc" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">SNPContigLoc</a> and <a href="/projects/SNP/snp_db_table_description.cgi?t=ContigInfo" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">ContigInfo</a> tables using the <a href="/SNP/snp_db_list_table.cgi" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">dbSNP Database Dictionary</a>.(<b>11/14/08</b>)</p></blockquote></div></div></div><div id="FTP_Finding_Specific.Finding_Sequence_Da"><h2 id="_FTP_Finding_Specific_Finding_Sequence_Da_">Finding Sequence Data in CSV Format</h2><div><h4 id="FTP_Finding_Specific.i_am_submitting_seq">I am submitting 
sequence to Illumina for Golden Gate assay oligo design, which requires a Microsoft Excel file in csv format, where each FASTA sequence is in a single cell of the file. Can I retrieve data from dbSNP in this format?</h4><blockquote><p>Both flanks and the alleles need to be in the same cell of an excel file. An adjacent cell in the same row would have the rsID number.</p><p>The data you need can be obtained from dbSNP's current FTP reports.</p><p>For example, you can look at the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/dog_9615/rs_fasta/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FASTA report for dog</a></p><p>Please note that the sequences are directly from submissions. You may want to verify the sequences during your oligo design.(<b>06/02/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Microarray"><h2 id="_FTP_Finding_Specific_Finding_Microarray_">Finding Microarray Data</h2><div><h4 id="FTP_Finding_Specific.do_you_have_any_aff">Do you have any AFFY or ILLUMINA array data available?</h4><blockquote><p>What we have is located in the dbSNP FTP site in the human <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/GWAS_arrays/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">GWAS_arrays</a> directory.(<b>10/08/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_can_i_downloa_1">Where can I download individual 1M Illumina SNP data from dbSNP?</h4><blockquote><p>The data is available in XML format in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">&#x0201c;/organisms/human_9606/</a>&#x0201d; directory of the dbSNP FTP site. 
Go to &#x0201c;<a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/GWAS_arrays/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">GWAS arrays</a>&#x0201d; and then select <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/GWAS_arrays/ILLUMINA.ILLUMINA_Human_1M.xml.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">/ILLUMINA.ILLUMINA_Human_1M.xml.gz</a>. (<b>11/28/08</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.we_are_using_illumi">We are using Illumina HumanHap550 V1, but Illumina provides chromosome positions based on Build 35. Can you give me the chromosome positions based on Build 36?</h4><blockquote><p>Please check the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/GWAS_arrays/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">Human GWAS array directory</a>, located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">dbSNP FTP site</a>. (<b>06/02/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Merged_RefS"><h2 id="_FTP_Finding_Specific_Finding_Merged_RefS_">Finding Merged RefSNP (rs) Data</h2><div><h4 id="FTP_Finding_Specific.i_want_to_find_all">I want to find all the refSNPs that got merged in build 127, but when I downloaded RsMergeArch.bcp.gz, I couldn&#x02019;t find a single entry for Build 127.</h4><blockquote><p>You are right that the build_id in RsMergeArch should be set to 127. This will be fixed for the next build.</p><p>For now, please use the following rule to find all the merged refSNPs in build 127: Since build 126 was released on May 4, 2006, find all the rows in RsMergeArch that were created after May 4, 2006.</p><p>For example, the sql could be:</p><p>select * from RsMergeArch where create_time &#x0003e; '5/4/06'</p><p>There should be 324938 merged pairs of human SNPs for build 127. 
(<b>5/28/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.do_you_have_a_table">Do you have a table of merged SNPs somewhere within dbSNP?</h4><blockquote><p>The <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/RsMergeArch.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">rs merge table</a> (RsMergeArch) is on the dbSNP ftp site, and the column definitions for it are located in dbSNP_main_table.sql.gz, which can be found in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/shared_schema" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">shared_schema</a> directory of the dbSNP FTP site. The rsHigh column in the RsMergeArch table contains the rsID numbers that were merged away (rsHigh is merged to rsLow). Due to multiple merge events, sometimes rsLow is merged even further. The &#x0201c;rsCurrent&#x0201d; column refers to the current refSNP. (<b>11/14/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.how_do_i_query_dbsn">How do I query dbSNP so that it will return a flat or xml file containing the new RefSNP (rs) ID number into which a previously valid rs recently merged?</h4><blockquote><p>You can get the rs merge history of all rs numbers from your organism&#x02019;s (human in this case) <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/RsMergeArch.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">RsMergeArch table</a> located on the dbSNP ftp site.</p><p>The following example shows that rs4344934 has been merged into <a href="/snp/?term=1107123" class="bk_tag" ref="pagearea=body&amp;targetsite=entrez&amp;targetcat=term&amp;targettype=snp">rs1107123</a>:</p><pre>gzcat RsMergeArch.bcp.gz | grep 4344934<br />4344934 1107123 123&#x000a0;&#x000a0;&#x000a0;&#x000a0; 1&#x000a0;&#x000a0;&#x000a0;&#x000a0;&#x000a0;&#x000a0; 2004-09-24 
18:49:00&#x000a0;&#x000a0;&#x000a0;&#x000a0; 2004-10-10 <br />11:55:00&#x000a0;&#x000a0;&#x000a0;&#x000a0; 1107123 1</pre><p>Also, you can now retrieve a list of merged rs numbers from <a href="/sites/entrez?db=snp" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Entrez SNP</a>. Just type &#x0201c;mergedrs&#x0201d; (without the quotation marks) in the text box at the top of the page and click the &#x0201c;go&#x0201d; button. Each entry in the returned list will include the old rs number that has merged, and the new rs number it has merged into (with a link to the refSNP page for the new rs number). You can limit the output to merged rs numbers within a certain species by clicking on the &#x0201c;Limits&#x0201d; tab and then selecting the organism you wish from the organism selection box. <b>(5/25/05:11/03/08)</b></p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Deleted_no"><h2 id="_FTP_Finding_Specific_Finding_Deleted_no_">Finding Deleted (no longer used) refSNP Numbers</h2><div><h4 id="FTP_Finding_Specific.the__rscurrent_fiel">The &#x0201c;rsCurrent&#x0201d; field in RsMergeArch contains 129,000 rs numbers not in the ASN.1 flat files or in a dbSNP web search. Is there a list of expired rs numbers?</h4><blockquote><p>Let me explain how we track both merged and deleted (an entirely different process from merging) refSNP (rs) numbers, by using a hypothetical example where a &#x0201c;chain merge&#x0201d; (multiple rs numbers merge into each other) occurs:</p><p>For example, let us say rs &#x0201c;A&#x0201d; merged into rs &#x0201c;B&#x0201d;, and later, rs &#x0201c;B&#x0201d; merged into rs &#x0201c;C&#x0201d;. As a result of the first merge, the entry for rs &#x0201c;A&#x0201d; in rsCurrent is updated to rs &#x0201c;B&#x0201d;; after the second merge, rsCurrent is then updated to rs &#x0201c;C&#x0201d;. 
Now, if rs &#x0201c;C&#x0201d;&#x02019;s submitters withdraw all the member ss numbers within the refSNP cluster rs &#x0201c;C&#x0201d;, then rs &#x0201c;C&#x0201d; will get an entry in the SNPHistory table (the SNPHistory table ONLY contains SNPs that have "become history" &#x02014; that is, SNPs that have been completely deleted). Please see the FTP file SNPHistory.bcp (located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/organism_data/human_9606/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">snp/database/organism_data/species of interest</a> directory). To find the column names for the SNPHistory table, download the human_9606_table.sql, which is located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_schema/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">human organism_schema directory</a>.</p><p>Getting back to RsMergeArch: since withdrawing rs &#x0201c;C&#x0201d; is not a merge action, the table RsMergeArch is not updated. RsMergeArch is used to track "rs merge" actions only. I can see that this might be confusing, so when time allows, we will add the following explanation to the RsMergeArch table definition, to make the RsMergeArch.rsCurrent meaning clearer:</p><p>RsMergeArch is used to track each rs merge event.</p><p>If an rs number in RsMergeArch.rsCurrent is withdrawn from dbSNP by submitter request, then the rs number of the same value as that in rsCurrent will be entered into the SNPHistory table (which contains deleted rs numbers only).</p><p>Please note: "rsCurrent" in RsMergeArch does not mean the "current rs number" in the current dbSNP build.
(<b>08/12/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Method_Data"><h2 id="_FTP_Finding_Specific_Finding_Method_Data_">Finding Method Data</h2><div><h4 id="FTP_Finding_Specific.where_can_i_find_a_3">Where can I find a SNP file that contains method information?</h4><blockquote><p>Go to the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/shared_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">shared_data directory</a> of the dbSNP FTP site, and look at the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/shared_data/Method.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">Method</a> and <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/shared_data/MethodLine.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">MethodLine</a> .bcp files for information on the methods used by submitters for their submissions. (<b>1/18/06</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_SNP_data_fo"><h2 id="_FTP_Finding_Specific_Finding_SNP_data_fo_">Finding SNP data for NCBI Genome Builds</h2><div><h4 id="FTP_Finding_Specific.how_can_i_get_the_s">How can I get the SNP data for NCBI&#x02019;s genome build 34?</h4><blockquote><p>To get the mapping coordinates for build 34.3, please see the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/database/organism_data/human_9606/b125_SNPContigLoc_34_3.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SNPContigLoc_34_3.bcp.gz</a> table for the species of interest on the dbSNP FTP site.</p><p>You might also wish to consult tables b125_SNPMapInfo_34_5 and b125_ContigInfo_34_5 in the same FTP directory.
Please see the <a href="/SNP/snp_db_list_table.cgi" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Data Dictionary</a> for table descriptions of the above tables.</p><p>Please note that some refSNP (rs) numbers might have been merged (if they are found to map to the same location in a later build). The rs merge history is located in the RsMergeArch table, located in the same FTP directory as the aforementioned tables, or you can retrieve a list of merged rs numbers from <a href="/sites/entrez?db=snp" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Entrez SNP</a>. Just type &#x0201c;mergedrs&#x0201d; (without the quotation marks) in the text box at the top of the page and click the &#x0201c;go&#x0201d; button. Each entry in the returned list will include the old rs number that has merged, and the new rs number it has merged into (with a link to the refSNP page for the new rs number). You can limit the output to merged rs numbers within a certain species by clicking on the &#x0201c;Limits&#x0201d; tab and then selecting the organism you wish from the organism selection box. (<b>4/28/06:11/03/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Submitter_D"><h2 id="_FTP_Finding_Specific_Finding_Submitter_D_">Finding Submitter Data</h2><div><h4 id="FTP_Finding_Specific.although_i_can_sear">Although I can search dbSNP for CSHL-HAPMAP, the output is too large and lists SNPs submitted by CSHL-HAPMAP and others, while I need just those submitted originally by HAPMAP.</h4><blockquote><p>CSHL-HAPMAP genotyped about 4 million of the 10 million refSNPs in dbSNP, so I&#x02019;m assuming you&#x02019;d like to find those SNPs that have genotype data from HapMap as opposed to novel SNP assays submitted by HapMap.</p><p>When you said that Entrez SNP gives you too much output, what display format did you choose?
If you select the "brief" format, you will get a list of just the search&#x02019;s resulting refSNP numbers. Or, you can take a look at <a href="/projects/SNP/SNPeutils.htm" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">eUtils</a> as a means of retrieving data in batches.</p><p>Another alternative would be to use the *.bcp file approach:</p><p>A *.bcp file is a text file of table column values separated by tabs. If you can work with *.bcp files either by using scripts or databases, then you can achieve what you want by using two tables: SNP_bitfield and SNPChrPosOnRef, both of which are located in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">organism_data</a> directory of the dbSNP FTP site. First, take a look at page 2 (F6-HapMap properties) of the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/specs/dbSNP_bitField_v3.pdf" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">bitfield pdf</a>. Here, you&#x02019;ll see that when the SNP_bitfield.hapmap_prop equals 2, it means that the SNP has had a HapMap genotype (phase2) submitted. By using this information in conjunction with the data in SNPChrPosOnRef, which lists the chromosome and position for each SNP on the reference assembly, you can get the list of refSNP numbers you wanted.</p><p>For future queries of this sort, you can use the *.bcp file approach or check back with us for a SNP Genome Workbench plug-in which will allow flexible queries and reporting using the data in SNP_bitfield within <a href="/projects/gbench/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Genome Workbench</a>.
This system is currently under development, and should be available soon. (<b>11/01/07</b>)</p></blockquote></div><div><h4 id="FTP_Finding_Specific.where_do_i_find_a_l">Where do I find a list of submitters and the number of submitted SNP (ss) and refSNP (rs) clusters that each has submitted?</h4><blockquote><p>You can get this information from the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/dn_handleCount.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">dn_handleCount.bcp table</a> for your organism on the dbSNP ftp site. If you know the submitter handle for the lab you are interested in, try the following:</p><dl class="temp-labeled-list"><dt>1.</dt><dd><p class="no_top_margin">Find the &#x0201c;Submitter Information&#x0201d; section of the <a href="/SNP/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">dbSNP home page</a>, and click on the words &#x0201c;By Submitter&#x0201d;.</p></dd><dt>2.</dt><dd><p class="no_top_margin">You will get a page with a text box. Enter the handle of the lab of interest in the text box (e.g. SNP500CANCER) and click the &#x0201c;Search&#x0201d; button.</p></dd></dl><p>You will receive a report that includes the submitter&#x02019;s name, their institution, batch types as well as the ss counts and the rs counts for that submitter.
<b>(1/4/05)</b></p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Submitter_R"><h2 id="_FTP_Finding_Specific_Finding_Submitter_R_">Finding Submitter Referenced Genbank Accessions</h2><div><h4 id="FTP_Finding_Specific.are_snp_submitter_r">Are SNP submitter referenced Genbank accessions available for download?</h4><blockquote><p>You can find SNP submitter referenced accessions in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/zebrafish_7955/database/organism_data/SubSNPAcc.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SubSNPAcc.bcp.gz</a> and <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/zebrafish_7955/database/organism_data/SubSNP.bcp.gz" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">SubSNP.bcp.gz</a> tables located in the organism_data sub-directory for your particular organism on the dbSNP FTP site. You'll have to join these tables using subsnp_id to get the submitted accession for the refSNP (rs) numbers of interest. (<b>3/10/06</b>).</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Validation"><h2 id="_FTP_Finding_Specific_Finding_Validation_">Finding Validation Data</h2><div><h4 id="FTP_Finding_Specific.where_can_i_find_a_4">Where can I find a variation status field as defined in HGVbase for the mouse genome in dbSNP?</h4><blockquote><p>The validation fields are in the XML dump. The complete dbSNP XML mouse data dump is on the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/mouse_10090/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FTP site</a>. The validation fields are defined in the <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/specs/docsum_2005.xsd" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">docsum_2005</a>.
(ud:<b>03/19/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_Variation_C"><h2 id="_FTP_Finding_Specific_Finding_Variation_C_">Finding Variation Class Data</h2><div><h4 id="FTP_Finding_Specific.if_i_want_to_downlo">If I want to download all the indels from dbSNP, do I download the SNP table? If so, where is it?</h4><blockquote><p>Before I give you the steps to download the SNP table, I would like to mention that you can also get all the indels housed in dbSNP using an Entrez Search:</p><dl class="temp-labeled-list"><dt>1.</dt><dd><p class="no_top_margin">Go to the <a href="/sites/entrez?db=snp" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">Entrez SNP page</a>, click on the grey &#x0201c;Limits&#x0201d; tab near the top of the page.</p></dd><dt>2.</dt><dd><p class="no_top_margin">Once you are on the <a href="/sites/entrez" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">limits page</a>, go to the &#x0201c;SNP Class&#x0201d; box, and click on &#x0201c;in del&#x0201d;.</p></dd></dl><p>Here are the steps for downloading the SNP table:</p><dl class="temp-labeled-list"><dt>1.</dt><dd><p class="no_top_margin">Go to the left blue side bar on the <a href="/SNP" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=uri">dbSNP home page</a>, and Click on &#x0201c;General&#x0201d;.</p></dd><dt>2.</dt><dd><p class="no_top_margin">From the released set of choices, click on &#x0201c;FTP Download&#x0201d;.</p></dd><dt>3.</dt><dd><p class="no_top_margin">For the purpose of this example, I will assume you need the SNP table for human. 
To find it, you would go to the human <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/human_9606/database/organism_data/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp"><wbr style="display:inline-block"></wbr>/database/organism_data/</a> directory.</p></dd></dl><p>(<b>10/08/08</b>)</p></blockquote></div></div><div id="FTP_Finding_Specific.Finding_SNPs_for_a"><h2 id="_FTP_Finding_Specific_Finding_SNPs_for_a_">Finding SNPs for a Specific Organism</h2><div><h4 id="FTP_Finding_Specific.how_do_i_download_a_1">How do I download all the SNPs for Bos taurus? I need the SNP positions on each chromosome and the bovine reference build (Btau3.1 or Btau4).</h4><blockquote><p>You can download all of the SNPs <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/organisms/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">for an organism</a> from the dbSNP <a href="ftp://ftp.ncbi.nlm.nih.gov/snp/" ref="pagearea=body&amp;targetsite=external&amp;targetcat=link&amp;targettype=ftp">FTP</a> site in various formats. The XML, ASN.1, flat file, or chromosome report should have the SNP positions.(<b>05/22/08</b>)</p></blockquote></div></div><div id="bk_toc_contnr"></div></div></div>
<div class="post-content"><div><div class="half_rhythm"><a href="/books/about/copyright/">Copyright Notice</a></div><div class="small"><span class="label">Bookshelf ID: NBK573445</span></div><div style="margin-top:2em" class="bk_noprnt"><a class="bk_cntns" href="/books/n/helpsnpfaq/">Contents</a><div class="pagination bk_noprnt"><a class="active page_link prev" href="/books/n/helpsnpfaq/FTP_Navigating_dbSNP/" title="Previous page in this title">&lt; Prev</a><a class="active page_link next" href="/books/n/helpsnpfaq/FTP_SNP_Report_Files/" title="Next page in this title">Next &gt;</a></div></div></div></div>
</div>
<!-- Custom content below content -->
<div class="col4">
</div>
<!-- Book content -->
<!-- Custom content below bottom nav -->
<div class="col5">
</div>
</div>
<div id="rightcolumn" class="four_col col last">
<!-- Custom content above discovery portlets -->
<div class="col6">
<div id="ncbi_share_book"><a href="#" class="ncbi_share" data-ncbi_share_config="popup:false,shorten:true" ref="id=NBK573445&amp;db=books">Share</a></div>
</div>
<div xmlns:np="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"></div><div class="portlet"><div class="portlet_head"><div class="portlet_title"><h3><span>Views</span></h3></div><a name="Shutter" sid="1" href="#" class="portlet_shutter" title="Show/hide content" remembercollapsed="true" pgsec_name="PDF_download" id="Shutter"></a></div><div class="portlet_content"><ul xmlns:np="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" class="simple-list"><li><a href="/books/NBK573445/?report=reader">PubReader</a></li><li><a href="/books/NBK573445/?report=printable">Print View</a></li><li><a data-jig="ncbidialog" href="#_ncbi_dlg_citbx_NBK573445" data-jigconfig="width:400,modal:true">Cite this Page</a><div id="_ncbi_dlg_citbx_NBK573445" style="display:none" title="Cite this Page"><div class="bk_tt">SNP FAQ Archive [Internet]. Bethesda (MD): National Center for Biotechnology Information (US); 2005-. Finding Specific Data in dbSNPs FTP Files. 
2005 Jul 7 [Updated 2014 Feb 18].<span class="bk_cite_avail"></span></div></div></li><li><a href="/books/NBK573445/pdf/Bookshelf_NBK573445.pdf">PDF version of this page</a> (137K)</li><li><a href="/books/n/helpsnpfaq/pdf/">PDF version of this title</a> (17K)</li></ul></div></div><div class="portlet"><div class="portlet_head"><div class="portlet_title"><h3><span>In this Page</span></h3></div><a name="Shutter" sid="1" href="#" class="portlet_shutter" title="Show/hide content" remembercollapsed="true" pgsec_name="page-toc" id="Shutter"></a></div><div class="portlet_content"><ul xmlns:np="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" class="simple-list"><li><a href="#FTP_Finding_Specific.Finding_Functional" ref="log$=inpage&amp;link_id=inpage">Finding Functional Class Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Population" ref="log$=inpage&amp;link_id=inpage">Finding Population Diversity Data</a></li><li><a href="#FTP_Finding_Specific.Finding_IDs" ref="log$=inpage&amp;link_id=inpage">Finding IDs</a></li><li><a href="#FTP_Finding_Specific.Finding_Mapping_Dat" ref="log$=inpage&amp;link_id=inpage">Finding Mapping Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Sequence_Da" ref="log$=inpage&amp;link_id=inpage">Finding Sequence Data in CSV Format</a></li><li><a href="#FTP_Finding_Specific.Finding_Microarray" ref="log$=inpage&amp;link_id=inpage">Finding Microarray Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Merged_RefS" ref="log$=inpage&amp;link_id=inpage">Finding Merged RefSNP (rs) Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Deleted_no" ref="log$=inpage&amp;link_id=inpage">Finding Deleted (no longer used) refSNP Numbers</a></li><li><a href="#FTP_Finding_Specific.Finding_Method_Data" ref="log$=inpage&amp;link_id=inpage">Finding Method Data</a></li><li><a href="#FTP_Finding_Specific.Finding_SNP_data_fo" ref="log$=inpage&amp;link_id=inpage">Finding SNP data for NCBI Genome 
Builds</a></li><li><a href="#FTP_Finding_Specific.Finding_Submitter_D" ref="log$=inpage&amp;link_id=inpage">Finding Submitter Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Submitter_R" ref="log$=inpage&amp;link_id=inpage">Finding Submitter Referenced Genbank Accessions</a></li><li><a href="#FTP_Finding_Specific.Finding_Validation" ref="log$=inpage&amp;link_id=inpage">Finding Validation Data</a></li><li><a href="#FTP_Finding_Specific.Finding_Variation_C" ref="log$=inpage&amp;link_id=inpage">Finding Variation Class Data</a></li><li><a href="#FTP_Finding_Specific.Finding_SNPs_for_a" ref="log$=inpage&amp;link_id=inpage">Finding SNPs for a Specific Organism</a></li></ul></div></div><div class="portlet"><div class="portlet_head"><div class="portlet_title"><h3><span>Other titles in this collection</span></h3></div><a name="Shutter" sid="1" href="#" class="portlet_shutter" title="Show/hide content" remembercollapsed="true" pgsec_name="source-links" id="Shutter"></a></div><div class="portlet_content"><ul xmlns:np="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" class="simple-list"><li><a href="/books/n/helpcollect/">NCBI Help Manual</a></li></ul></div></div><div class="portlet"><div class="portlet_head"><div class="portlet_title"><h3><span>Recent Activity</span></h3></div><a name="Shutter" sid="1" href="#" class="portlet_shutter" title="Show/hide content" remembercollapsed="true" pgsec_name="recent_activity" id="Shutter"></a></div><div class="portlet_content"><div xmlns:np="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" id="HTDisplay" class=""><div class="action"><a href="javascript:historyDisplayState('ClearHT')">Clear</a><a href="javascript:historyDisplayState('HTOff')" class="HTOn">Turn Off</a><a href="javascript:historyDisplayState('HTOn')" class="HTOff">Turn On</a></div><ul id="activity"><li class="ra_rcd ralinkpopper two_line"><a class="htb ralinkpopperctrl" 
ref="log$=activity&amp;linkpos=1" href="/portal/utils/pageresolver.fcgi?recordid=67c8c52ab15b832ebc8310fe">Finding Specific Data in dbSNPs FTP Files - SNP FAQ Archive</a><div class="ralinkpop offscreen_noflow">Finding Specific Data in dbSNPs FTP Files - SNP FAQ Archive<div class="brieflinkpopdesc"></div></div><div class="tertiary"></div></li><li class="ra_rcd ralinkpopper two_line"><a class="htb ralinkpopperctrl" ref="log$=activity&amp;linkpos=2" href="/portal/utils/pageresolver.fcgi?recordid=67c8c529f4a390645ea4ae66">Navigating in dbSNPs FTP Site - SNP FAQ Archive</a><div class="ralinkpop offscreen_noflow">Navigating in dbSNPs FTP Site - SNP FAQ Archive<div class="brieflinkpopdesc"></div></div><div class="tertiary"></div></li><li class="ra_rcd ralinkpopper two_line"><a class="htb ralinkpopperctrl" ref="log$=activity&amp;linkpos=3" href="/portal/utils/pageresolver.fcgi?recordid=67c8c528b15b832ebc83080e">Locating and Using Data from dbSNPs FTP Site - SNP FAQ Archive</a><div class="ralinkpop offscreen_noflow">Locating and Using Data from dbSNPs FTP Site - SNP FAQ Archive<div class="brieflinkpopdesc"></div></div><div class="tertiary"></div></li><li class="ra_rcd ralinkpopper two_line"><a class="htb ralinkpopperctrl" ref="log$=activity&amp;linkpos=4" href="/portal/utils/pageresolver.fcgi?recordid=67c8c528ab82281a80ad906f">dbSNP and HapMap Data - SNP FAQ Archive</a><div class="ralinkpop offscreen_noflow">dbSNP and HapMap Data - SNP FAQ Archive<div class="brieflinkpopdesc"></div></div><div class="tertiary"></div></li><li class="ra_rcd ralinkpopper two_line"><a class="htb ralinkpopperctrl" ref="log$=activity&amp;linkpos=5" href="/portal/utils/pageresolver.fcgi?recordid=67c8c527f4a390645ea49f81">dbSNP and Haplotype Tagged SNPs - SNP FAQ Archive</a><div class="ralinkpop offscreen_noflow">dbSNP and Haplotype Tagged SNPs - SNP FAQ Archive<div class="brieflinkpopdesc"></div></div><div class="tertiary"></div></li></ul><p class="HTOn">Your browsing activity is empty.</p><p 
class="HTOff">Activity recording is turned off.</p><p id="turnOn" class="HTOff"><a href="javascript:historyDisplayState('HTOn')">Turn recording back on</a></p><a class="seemore" href="/sites/myncbi/recentactivity">See more...</a></div></div></div>
<!-- Custom content below discovery portlets -->
<div class="col7">
</div>
</div>
</div>
<!-- Custom content after all -->
<div class="col8">
</div>
<div class="col9">
</div>
<script type="text/javascript" src="/corehtml/pmc/js/jquery.scrollTo-1.4.2.js"></script>
<script type="text/javascript">
(function (jq) {
    // Wire up every ".skiplink" anchor: its href is used as a selector for the
    // element to jump to. That element is made programmatically focusable and
    // receives focus once the scroll has finished.
    jq('.skiplink').each(function (index, link) {
        var $link = jq(link);
        var $target = jq($link.attr('href'));

        // tabindex -1 lets the target take focus without joining the tab order.
        $target.attr('tabindex', '-1');
        $target.addClass('skiptarget');

        $link.on('click', function (evt) {
            // Replace the default anchor jump with a scrollTo call (duration 0).
            evt.preventDefault();
            jq.scrollTo($target, 0, {
                onAfter: function () {
                    $target.focus();
                }
            });
        });
    });
})(jQuery);
</script>
</div>
<div class="bottom">
<script type="text/javascript">
// Global search-term data: a highlighter mode, a timestamp string, and the
// list of terms (duplicates are kept exactly as emitted).
// NOTE(review): presumably read by a highlighting script loaded elsewhere; confirm.
var PBooksSearchTermData = {
    "highlighter": "bold",
    "dateTime": "03/05/2025 16:32:49",
    "terms": [
        "attack",
        "heart",
        "heart attack",
        "infarction",
        "myocardial",
        "myocardial infarction",
        "myocardial infarction",
        "myocardial infarction"
    ]
};
</script>
<div id="NCBIFooter_dynamic">
<!--<component id="Breadcrumbs" label="breadcrumbs"/>
<component id="Breadcrumbs" label="helpdesk"/>-->
</div>
<div class="footer" id="footer">
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<defs>
<style>
.cls-11 {
fill: #737373;
}
</style>
</defs>
<title>Twitter</title>
<path class="cls-11" d="M250.11,105.48c-7,3.14-13,3.25-19.27.14,8.12-4.86,8.49-8.27,11.43-17.46a78.8,78.8,0,0,1-25,9.55,39.35,39.35,0,0,0-67,35.85,111.6,111.6,0,0,1-81-41.08A39.37,39.37,0,0,0,81.47,145a39.08,39.08,0,0,1-17.8-4.92c0,.17,0,.33,0,.5a39.32,39.32,0,0,0,31.53,38.54,39.26,39.26,0,0,1-17.75.68,39.37,39.37,0,0,0,36.72,27.3A79.07,79.07,0,0,1,56,223.34,111.31,111.31,0,0,0,116.22,241c72.3,0,111.83-59.9,111.83-111.84,0-1.71,0-3.4-.1-5.09C235.62,118.54,244.84,113.37,250.11,105.48Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11" d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12" d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12" d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12" d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12" d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12" d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12" d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12" d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
<defs><style>.cls-1{fill:#737373;}</style></defs>
<title>NCBI Insights Blog</title>
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
</svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter" target="_blank" rel="noopener noreferrer"><svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" version="1.1" x="0px" y="0px" viewBox="0 0 249 249" style="enable-background:new 0 0 249 249;" xml:space="preserve">
<style type="text/css">
.st20 {
fill: #FFFFFF;
}
.st30 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
</style>
<title>Twitter</title>
<g>
<g>
<g>
<path class="st20" d="M192.9,88.1c-5,2.2-9.2,2.3-13.6,0.1c5.7-3.4,6-5.8,8.1-12.3c-5.4,3.2-11.4,5.5-17.6,6.7 c-10.5-11.2-28.1-11.7-39.2-1.2c-7.2,6.8-10.2,16.9-8,26.5c-22.3-1.1-43.1-11.7-57.2-29C58,91.6,61.8,107.9,74,116 c-4.4-0.1-8.7-1.3-12.6-3.4c0,0.1,0,0.2,0,0.4c0,13.2,9.3,24.6,22.3,27.2c-4.1,1.1-8.4,1.3-12.5,0.5c3.6,11.3,14,19,25.9,19.3 c-11.6,9.1-26.4,13.2-41.1,11.5c12.7,8.1,27.4,12.5,42.5,12.5c51,0,78.9-42.2,78.9-78.9c0-1.2,0-2.4-0.1-3.6 C182.7,97.4,189.2,93.7,192.9,88.1z"></path>
</g>
</g>
<circle class="st30" cx="124.4" cy="128.8" r="108.2"></circle>
</g>
</svg></a></li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine" aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" version="1.1" x="0px" y="0px" viewBox="0 0 249 249" style="enable-background:new 0 0 249 249;" xml:space="preserve">
<style type="text/css">
.st10 {
fill: #FFFFFF;
}
.st110 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
</style>
<title>Facebook</title>
<g>
<g>
<path class="st10" d="M159,99.1h-24V88.4c0-5,3.3-6.2,5.7-6.2h16.8V60l-24.4-0.1c-22.1,0-26.2,16.5-26.2,27.1v12.1H90v22.5h16.9 v67.5H135v-67.5h21.7L159,99.1z"></path>
</g>
</g>
<circle class="st110" cx="123.6" cy="123.2" r="108.2"></circle>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="Youtube" target="_blank" rel="noopener noreferrer"><svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" version="1.1" x="0px" y="0px" viewBox="0 0 249 249" style="enable-background:new 0 0 249 249;" xml:space="preserve">
<title>Youtube</title>
<style type="text/css">
.st4 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
.st5 {
fill: #FFFFFF;
}
</style>
<circle class="st4" cx="124.2" cy="123.4" r="108.2"></circle>
<g transform="translate(0,-952.36218)">
<path class="st5" d="M88.4,1037.4c-10.4,0-18.7,8.3-18.7,18.7v40.1c0,10.4,8.3,18.7,18.7,18.7h72.1c10.4,0,18.7-8.3,18.7-18.7 v-40.1c0-10.4-8.3-18.7-18.7-18.7H88.4z M115.2,1058.8l29.4,17.4l-29.4,17.4V1058.8z"></path>
</g>
</svg></a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br />
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br />
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white">FOIA</a><br />
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br />
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<nav class="bottom-links">
<ul class="mt-3">
<li>
<a class="text-white" href="//www.nlm.nih.gov/">NLM</a>
</li>
<li>
<a class="text-white" href="https://www.nih.gov/">NIH</a>
</li>
<li>
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
</li>
<li>
<a class="text-white" href="https://www.usa.gov/">USA.gov</a>
</li>
</ul>
</nav>
</div>
</div>
</div>
</section>
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
</div>
</div>
</div>
<!--/.page-->
</div>
<!--/.wrap-->
</div><!-- /.twelve_col -->
</div>
<!-- /.grid -->
<span class="PAFAppResources"></span>
<!-- BESelector tab -->
<noscript><img alt="statistics" src="/stat?jsdisabled=true&amp;ncbi_db=books&amp;ncbi_pdid=book-part&amp;ncbi_acc=NBK573445&amp;ncbi_domain=helpsnpfaq&amp;ncbi_report=record&amp;ncbi_type=fulltext&amp;ncbi_objectid=&amp;ncbi_pcid=/NBK573445/&amp;ncbi_pagename=Finding Specific Data in dbSNPs FTP Files - SNP FAQ Archive - NCBI Bookshelf&amp;ncbi_bookparttype=chapter&amp;ncbi_app=bookshelf" /></noscript>
<!-- usually for JS scripts at page bottom -->
<!--<component id="PageFixtures" label="styles"></component>-->
<!-- CE8B5AF87C7FFCB1_0191SID /projects/books/PBooks@9.11 portal107 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
<script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4216699/js/3879255/4121861/3501987/4008961/3893018/3821238/4062932/4209313/4212053/4076480/3921943/3400083/3426610.js" snapshot="books"></script></body>
</html>