nih-gov/www.ncbi.nlm.nih.gov/refseq/announcements/2015/index.html

798 lines
58 KiB
HTML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<!-- AppResources meta begin -->
<meta name="paf-app-resources" content="" />
<!-- AppResources meta end -->
<!-- TemplateResources meta begin -->
<meta name="paf_template" content="StdNCol" />
<!-- TemplateResources meta end -->
<!-- Page meta begin -->
<!-- Page meta end -->
<!-- Logger begin -->
<meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_app" content="refseq" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_pdid" content="static" />
<!-- Logger end -->
<title>RefSeq Announcements for 2015</title>
<!-- PageFixtures headcontent begin -->
<link type="text/css" rel="stylesheet" href="/core/assets/genome/css/genome.css" /><link type="text/css" rel="stylesheet" href="/core/assets/genome/css/genome_links.css" />
<!-- PageFixtures headcontent end -->
<!-- AppResources external_resources begin -->
<script type="text/javascript" src="/core/jig/1.15.6/js/jig.min.js"></script>
<!-- AppResources external_resources end -->
<!-- Page headcontent begin -->
<meta name="subsite" content="refseq" />
<meta name="path" content="refseq/announcements/2015" />
<meta name="modified" content="2017-12-01T21:32:03Z" />
<!-- Page headcontent end -->
<!-- PageFixtures resources begin -->
<link xmlns="http://www.w3.org/1999/xhtml" type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218191/css/4207974/4206132.css" xml:base="http://127.0.0.1/sites/static/header_footer" />
<!-- PageFixtures resources end -->
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8B84157C9B19810000000000940077.m_5" /><script type="text/javascript"><!--
// Page-level configuration globals emitted into the page head.
// ScriptPath: path prefix string '/portal/'. Its consumer is not visible in
// this file; presumably read by the portal client scripts (TODO confirm).
//
// objHierarchy: nested tree describing the components that make up this page.
// The root node has type "Layout"; nodes of type "Cluster" carry a "children"
// array; nodes of type "Portlet" are leaves and also carry a "shortname".
// Every node has a dotted "name" and a dotted "realname". The two can differ:
// several realname values contain an extra path segment (PAFPageSelector,
// PAFPageFixtures, PAFTemplateResources) that is absent from "name".
var ScriptPath = '/portal/';
var objHierarchy = {"name":"PAFAppLayout","type":"Layout","realname":"PAFAppLayout",
"children":[{"name":"PAFAppLayout.AppController","type":"Cluster","realname":"PAFAppLayout.AppController",
"children":[{"name":"PAFAppLayout.AppController.AppResources","type":"Portlet","realname":"PAFAppLayout.AppController.AppResources","shortname":"AppResources"},
{"name":"PAFAppLayout.AppController.RequestProcessor","type":"Portlet","realname":"PAFAppLayout.AppController.RequestProcessor","shortname":"RequestProcessor"},
{"name":"PAFAppLayout.AppController.Controller","type":"Cluster","realname":"PAFAppLayout.AppController.Controller",
"children":[{"name":"PAFAppLayout.AppController.Controller.AnnotStatusStaticContentController","type":"Portlet","realname":"PAFAppLayout.AppController.Controller.AnnotStatusStaticContentController","shortname":"AnnotStatusStaticContentController"}]},
{"name":"PAFAppLayout.AppController.Page","type":"Cluster","realname":"PAFAppLayout.AppController.Page",
"children":[{"name":"PAFAppLayout.AppController.Page.PAFPageSelectorData","type":"Portlet","realname":"PAFAppLayout.AppController.Page.PAFPageSelector.PAFPageSelectorData","shortname":"PAFPageSelectorData"},
{"name":"PAFAppLayout.AppController.Page.PAFStaticPage","type":"Cluster","realname":"PAFAppLayout.AppController.Page.PAFPageSelector.PAFStaticPage",
"children":[{"name":"PAFAppLayout.AppController.Page.PAFStaticPage.MainPortlet","type":"Portlet","realname":"PAFAppLayout.AppController.Page.PAFPageSelector.PAFStaticPage.MainPortlet","shortname":"MainPortlet"}]}]},
{"name":"PAFAppLayout.AppController.PageFixtures","type":"Cluster","realname":"PAFAppLayout.AppController.PageFixtures",
"children":[{"name":"PAFAppLayout.AppController.PageFixtures.PageFixturesP","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.PageFixturesP","shortname":"PageFixturesP"},
{"name":"PAFAppLayout.AppController.PageFixtures.SearchBar","type":"Cluster","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.SearchBar",
"children":[{"name":"PAFAppLayout.AppController.PageFixtures.SearchBar.SearchBarChooser","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.SearchBar.SearchBarChooser","shortname":"SearchBarChooser"},
{"name":"PAFAppLayout.AppController.PageFixtures.SearchBar.PAFSearchBar","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.SearchBar.PAFSearchBar","shortname":"PAFSearchBar"}]},
{"name":"PAFAppLayout.AppController.PageFixtures.HeaderFooter","type":"Cluster","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.HeaderFooter",
"children":[{"name":"PAFAppLayout.AppController.PageFixtures.HeaderFooter.NCBIBreadcrumbs","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.HeaderFooter.NCBIBreadcrumbs","shortname":"NCBIBreadcrumbs"},
{"name":"PAFAppLayout.AppController.PageFixtures.HeaderFooter.NCBIHelpDesk","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.HeaderFooter.NCBIHelpDesk","shortname":"NCBIHelpDesk"},
{"name":"PAFAppLayout.AppController.PageFixtures.HeaderFooter.NCBIApplog_NoScript_Ping","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.PAFPageFixtures.HeaderFooter.NCBIApplog_NoScript_Ping","shortname":"NCBIApplog_NoScript_Ping"}]},
{"name":"PAFAppLayout.AppController.PageFixtures.DummyPortlet","type":"Portlet","realname":"PAFAppLayout.AppController.PageFixtures.DummyPortlet","shortname":"DummyPortlet"}]},
{"name":"PAFAppLayout.AppController.TemplateResources","type":"Cluster","realname":"PAFAppLayout.AppController.TemplateResources",
"children":[{"name":"PAFAppLayout.AppController.TemplateResources.StdNColResources","type":"Portlet","realname":"PAFAppLayout.AppController.TemplateResources.PAFTemplateResources.StdNColResources","shortname":"StdNColResources"}]},
{"name":"PAFAppLayout.AppController.Logger","type":"Portlet","realname":"PAFAppLayout.AppController.Logger","shortname":"Logger"},
{"name":"PAFAppLayout.AppController.DebugConsole","type":"Portlet","realname":"PAFAppLayout.AppController.DebugConsole","shortname":"DebugConsole"}]}]};
--></script>
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218658/css/4121862/3974050/3917732/251717/4218659/4218660/14534/45193/3534283/4128070/4062871.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218658/css/3529741.css" media="print" /><script type="text/javascript">
// ObjectLinks: array holding a single link record (i:0). Its "f" callback
// forwards (src, dst) unchanged to fn_CopyValue, which is not defined in this
// file. The record names "p$ExL" as ename/sname and "p$el" as dname, with
// m:"CopyValue"; the exact meaning of these keys is not shown here.
// NOTE(review): presumably event/source/destination identifiers. Confirm
// against the portal framework.
var ObjectLinks=[{i:0, ename: "p$ExL", esid:"*", sname: "p$ExL", ssid:"*", dname:"p$el", dsid:"0",m:"CopyValue",p:[],f: function(src, dst) {fn_CopyValue(src, dst);}}]
// ActiveNames: map with the single key "p$ExL" set to 1, the same name used as
// ename/sname in ObjectLinks above.
var ActiveNames = {"p$ExL":1};
</script></head>
<body class=" static">
<div class="grid">
<div class="col twelve_col nomargin shadow">
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
<div class="sysmessages">
<noscript>
<p class="nojs">
<strong>Warning:</strong>
The NCBI web site requires JavaScript to function.
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
</p>
</noscript>
</div>
<!--/.sysmessage-->
<div class="wrap">
<div class="page">
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" id="universal_header" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
<div class="usa-banner-guidance-gov usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
<span class="fa fa-user" aria-hidden="true">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
<g style="fill: #fff">
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
</g>
</svg>
</span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
<span class="fa fa-times">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
</svg>
</span>
<span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br />
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
</div>
</div>
<!--/.header-->
<div class="header">
<div class="res_logo"><h1 class="res_name"><a href="/refseq/" title="RefSeq home">RefSeq</a></h1><h2 class="res_tagline">Integrated reference sequences</h2></div>
<div class="search"><form method="get" action="/refseq/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="refseq" selected="selected">RefSeq</option><option value="nuccore">Nucleotide</option><option value="pmc">PMC</option><option value="protein" class="last">Protein</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="refseq">RefSeq</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option 
value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label for="term" class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search RefSeq" value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="isEnabled:false,disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'yes'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div><input type="hidden" name="p$a" id="p$a" /><input type="hidden" name="p$l" id="p$l" value="PAFAppLayout" /><input type="hidden" name="p$st" id="p$st" value="refseq" /><input name="SessionId" id="SessionId" value="CE8B5AF87C7FFCB1_0191SID" disabled="disabled" type="hidden" /><input name="Snapshot" id="Snapshot" value="/projects/refseq/refseq@1.21" disabled="disabled" type="hidden" /></form></div>
</div>
<div class="nav_and_browser">
</div>
<!-- was itemctrl -->
<div class="container">
<div id="maincontent" class="content col twelve_col last">
<div class="col1">
<h1 id="refseq-announcements-for-2015">RefSeq Announcements for 2015</h1>
<div class="toc">
<ul>
<li><a href="#january-7-2015-announcing-refseq">January 7, 2015: Announcing RefSeq Release 69</a><ul>
<li><a href="#changes-since-the-previous-relea">Changes since the previous release:</a></li>
</ul>
</li>
<li><a href="#march-2015-delayed-installation-">March 2015: Delayed installation of RefSeq Release 70</a></li>
<li><a href="#may-7-2015-announcing-refseq-rel">May 7, 2015: Announcing RefSeq Release 70</a><ul>
<li><a href="#changes-since-the-previous-relea_1">Changes since the previous release:</a></li>
<li><a href="#protein-records">Protein records</a></li>
<li><a href="#nucleotide-records">Nucleotide records</a></li>
<li><a href="#quality-control">Quality control</a></li>
<li><a href="#locus_tag-format">locus_tag format</a></li>
<li><a href="#available-reports-and-documentat">Available Reports and Documentation</a></li>
<li><a href="#impact-to-ncbi-gene">Impact to NCBI Gene</a></li>
<li><a href="#ongoing-work">Ongoing work</a></li>
<li><a href="#using-this-data">Using this data</a></li>
<li><a href="#measurable-reduction-in-protein-">Measurable reduction in protein redundancy</a></li>
<li><a href="#definitions">Definitions</a></li>
</ul>
</li>
<li><a href="#july-13-2015-announcing-refseq-r">July 13, 2015: Announcing RefSeq Release 71</a><ul>
<li><a href="#changes-since-the-previous-relea_2">Changes since the previous release:</a></li>
</ul>
</li>
<li><a href="#august-27-2015-announcing-refseq">August 27, 2015: Announcing RefSeq Release 72</a><ul>
<li><a href="#changes-since-the-previous-relea_3">Changes since the previous release:</a></li>
</ul>
</li>
<li><a href="#november-2-2015-announcing-refse">November 2, 2015: Announcing RefSeq Release 73</a><ul>
<li><a href="#changes-since-the-previous-relea_4">Changes since the previous release:</a></li>
</ul>
</li>
</ul>
</div>
<h2 id="january-7-2015-announcing-refseq">January 7, 2015: Announcing RefSeq Release 69</h2>
<p>This full release incorporates genomic, transcript, and protein data available, as of January 2, 2015 and includes 74,127,019 records, 52,276,468 proteins, 9,973,568 RNAs, and sequences from 51,661 organisms. Additional information is available in the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-notes/archive/RefSeq-release69.txt">Release Notes</a>.</p>
<h3 id="changes-since-the-previous-relea">Changes since the previous release:</h3>
<p>[1] A list of updated organisms and dbSNP annotation summary is available here:
ftp://ftp.ncbi.nih.gov/snp/release-notes/RefSeq/refseq69.snp.rpt </p>
<p>[2] In this release, we saw an almost 50% increase in the count of genomic records in the vertebrate_other node, from 2161339 to 3081632. This increase correlates with the effort to annotate a large number of bird genome assemblies in late 2014. The complete list of RefSeq genomes annotated by NCBI's Eukaryotic Genome Annotation Pipeline is available here: http://www.ncbi.nlm.nih.gov/genome/annotation_euk/all/</p>
<p>Other nodes saw modest increases in record counts.</p>
<p>[3] The International Nucleotide Sequence Database Consortium (INSDC) has introduced a new feature key 'regulatory' and a set of feature classes. http://www.insdc.org/files/feature_table.html#7.2</p>
<p>It is RefSeq's policy to adhere to INSDC formats. NCBI has made the changes necessary to start using the new feature key and consequently poly-adenylation signal features are now displayed using the new format.</p>
<p>For example:
http://www.ncbi.nlm.nih.gov/nuccore/NM_001303444.1</p>
<pre><code> regulatory 1191..1196
/gene="HEXIM2"
/gene_synonym="L3"
/regulatory_class="polyA_signal_sequence"
</code></pre>
<h2 id="march-2015-delayed-installation-">March 2015: Delayed installation of RefSeq Release 70</h2>
<p>March 10, 2015: We are delaying the installation of RefSeq release 70 in order to do some additional quality assessment and prepare supplemental reports specific to this release. We anticipate releasing the data in approximately a week and apologize for the inconvenience.</p>
<p>March 12, 2015: We have identified some data concerns in the initial extraction for RefSeq release 70. We are currently working to update these issues and then will re-process data for the FTP release. We hope to install the release near the end of the month but cannot provide a firm date at this time.</p>
<p>March 31, 2015: The next RefSeq release (release number 70) will be provided in early May. In the meantime, new and updated RefSeq records continue to be provided in the RefSeq daily update directory, weekly updates of transcript and protein accessions are provided for a small number of more highly accessed vertebrates, and organism-specific genome plus annotation data (a snapshot in time) is available from the genomes FTP area. Example links to these areas include:</p>
<ol>
<li>
<p><a href="https://ftp.ncbi.nlm.nih.gov/refseq/daily/">ftp://ftp.ncbi.nlm.nih.gov/refseq/daily/</a> (RefSeq daily updates)</p>
</li>
<li>
<p><a href="https://ftp.ncbi.nlm.nih.gov/refseq/H_sapiens/mRNA_Prot">ftp://ftp.ncbi.nlm.nih.gov/refseq/H_sapiens/mRNA_Prot</a> (weekly transcript and protein updates; also available for rat, mouse, cow, pig, and Xenopus tropicalis)</p>
</li>
<li>
<p><a href="https://ftp.ncbi.nlm.nih.gov/genomes/refseq/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCF_000001405.28_GRCh38.p2/">ftp://ftp.ncbi.nlm.nih.gov/genomes/refseq/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCF_000001405.28_GRCh38.p2/</a> (updated annotation for the human reference genome)</p>
</li>
<li>
<p><a href="https://ftp.ncbi.nlm.nih.gov/genomes/refseq/vertebrate_mammalian/Mus_musculus/all_assembly_versions/GCF_000001635.23_GRCm38.p3">ftp://ftp.ncbi.nlm.nih.gov/genomes/refseq/vertebrate_mammalian/Mus_musculus/all_assembly_versions/GCF_000001635.23_GRCm38.p3</a> (updated annotation for the mouse reference genome)</p>
</li>
</ol>
<h2 id="may-7-2015-announcing-refseq-rel">May 7, 2015: Announcing RefSeq Release 70</h2>
<p>This full release incorporates genomic, transcript, and protein data available, as of April 30, 2015 and includes 74,720,563 records, 50,351,119 proteins, 11,310,700 RNAs, and sequences from 54,118 organisms. Additional information is available in the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-notes/archive/RefSeq-release70.txt">Release Notes</a>.</p>
<p>This comprehensive RefSeq release includes a number of changes to the bacterial RefSeq genomes including completion of the <a href="/refseq/about/prokaryotes/reannotation/">bacterial re-annotation project</a> and transition to the new <a href="/refseq/about/nonredundantproteins/">non-redundant RefSeq protein data model</a>. A similar update for Archaeal genomes will occur later this year. To facilitate your transition to using this data we are providing additional extensive <a href="/refseq/about/prokaryotes/">online documentation</a>, additional report files in the RefSeq FTP release-catalog&lt;<a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-catalog/">ftp://ftp.ncbi.nlm.nih.gov/refseq/release/release-catalog/</a>&gt; directory, custom informational messages on suppressed protein records (now replaced with non-redundant protein accessions), and custom messages on discontinued Gene records (the scope definition for Gene changed). The bacterial data model change offers advantages in annotation consistency, reduced protein redundancy, and improved management of protein names. Since the January RefSeq release, we have started a major initiative to improve bacterial RefSeq protein names.</p>
<h3 id="changes-since-the-previous-relea_1">Changes since the previous release:</h3>
<p>[1] A list of updated organisms and dbSNP annotation summary is available here:
ftp://ftp.ncbi.nih.gov/snp/release-notes/RefSeq/refseq70.snp.rpt </p>
<p>[2] Eukaryotic genome updates
This release includes updated annotation for the human reference genome (GRCh38.p2), the mouse reference genome (GRCm38) and the Caenorhabditis elegans reference genome corresponding to WormBase release WS245.</p>
<p>[3] Prokaryotic RefSeq data
This release reflects a large update of complete bacterial RefSeq genomes, proteins, and Genes.</p>
<p>NCBI decided to re-annotate all RefSeq prokaryotic genomes using NCBI’s genome annotation pipeline in order to make genome annotation comparable across genomes and species, instead of representing submitted annotation that was provided using different methods reflecting different states of technology development over time. Previously, it was possible that the same gene, in the same species, with an identical sequence for the gene’s genomic region might be annotated with a different protein simply because it was annotated using different methods. Because of the re-annotation, the same gene in the same species with the same sequence will now be annotated with exactly the same protein in RefSeq. If you’d like to learn more about the re-annotation project and what NCBI is doing to help you transition to using this new data, please see the RefSeq Re-annotation Project page at: http://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/reannotation/.</p>
<p>Previously, each annotated CDS was tracked with a distinct RefSeq protein accession number; however, given the facts that the identical protein sequence has been found on multiple re-annotated RefSeq genomes, coupled with the extensive sequencing of bacterial genomes (often of the same strain but different isolates) the RefSeq prokaryotic protein dataset was rapidly becoming very redundant. Therefore, rather than flood the protein database with thousands of completely identical proteins, NCBI has adopted the use of non-redundant (WP_) proteins for RefSeq prokaryotic genomes that are annotated using the NCBI pipeline. If the identical protein sequence (exactly the same protein sequence and length) appears on more than one RefSeq genome, NCBI simply re-uses the existing WP accession number instead of creating a new accession for each new occurrence and genome. For conserved proteins the same WP accession may appear on thousands of genomes. This is a first step toward dealing with a world when genomes are sequenced just for assays, rather than to discover novel proteins. We appreciate that this is new and a major change for RefSeq prokaryotic genomes, and that there are some issues still to be worked out to use these data smoothly, but we felt we needed to start making this change as the number of disease-outbreak and other isolate sequencing continues to increase rapidly.</p>
<p>Advantages of comprehensive re-annotation and non-redundant proteins:
- More consistent annotation across RefSeq bacterial genomes.
- Significant reduction in protein redundancy. This is most notable for heavily sequenced species.
For more information please see: http://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/reannotation/#reducedredundancy
- Significant improvement in protein name management. </p>
<p>This release:
The long term plan to re-annotate all RefSeq bacterial genomes using NCBI's prokaryotic genome annotation pipeline has now nearly completed and is included in this release. We anticipate that the remaining very small number of re-annotated bacterial genomes will be released by the end of the summer 2015. We also plan to re-annotate the archaeal genomes. As RefSeq bacterial genomes were re-annotated, the proteins were replaced with non-redundant RefSeq proteins (having the WP_ accession prefix). This data type was first announced in June 2013: http://www.ncbi.nlm.nih.gov/news/06-11-2013-wp-refseqs/. Thus &gt;7 million YP/NP protein accessions were removed since January, resulting in a decrease in the total number of protein accessions and a significant reduction in protein redundancy for the prokaryotic dataset. Removed accessions are reported here: ftp://ftp.ncbi.nlm.nih.gov/refseq/release/release-catalog/release70.removed-records.gz </p>
<p>A data mapping report is available in the release-catalog directory (<a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-catalog/archive/">release70.bacterial-reannotation-report.txt.gz</a>). </p>
<h3 id="protein-records">Protein records</h3>
<p>In all bacterial genomes, except reference genomes and a small number which have yet to be re-annotated, protein accessions NP/YP have been replaced with non-redundant protein accession numbers (WP_).</p>
<ul>
<li>&gt; 7 million bacterial YP_ and NP_ RefSeq proteins were suppressed as complete bacterial genomes were re-annotated to conform to the new data model</li>
<li>Nearly 1 million non-redundant protein records were updated in March and April 2015 to improve the protein name. These updates affected CDS “/product=” annotation details for all (&gt;31,000) of the RefSeq bacterial genomes and included typographical corrections, name format standardization, and improved functional information.</li>
<li>We have initiated a long-term project to validate and improve protein names for non-redundant protein records. In March and April we validated names for approximately 2 million records using multiple support lines from Swiss-Prot, HMM analysis, domain architecture analysis, and NCBI scientific staff curation.</li>
</ul>
<h3 id="nucleotide-records">Nucleotide records</h3>
<ul>
<li>&gt;6,400 new or re-annotated RefSeq bacterial genomes were released since January 2, 2015.</li>
<li>All new complete or draft RefSeq prokaryote genomes now use the accession format rule NZ_&lt;original_INSDC_accession&gt;. Complete genomes that were already accessioned using the ‘NC_’ prefix will continue to use that accession number. Thus, the accession prefix is no longer an indicator of a complete bacterial genome. Information about genome completeness is provided in the record DEFINITION line, the Assembly resource, and FTP reports provided by Assembly and Genome resources.</li>
</ul>
<h3 id="quality-control">Quality control</h3>
<ul>
<li>Over 450 RefSeq bacterial genomes that do not meet updated quality criteria were suppressed; some of these may be reinstated in the future after further improvements are made to NCBI’s prokaryotic genome annotation pipeline.</li>
<li>A supplemental file in the release-catalog directory (release70.addedQA-suppressedAssemblies.txt) reports details for a subset of bacterial genomes that were suppressed in March 2015 following an expansion of QA metrics and subsequent to curatorial review. This report illustrates some of the reasons for suppression. </li>
</ul>
<h3 id="locus_tag-format">locus_tag format</h3>
<p>Re-annotated RefSeq genome records have new locus_tags in the format of &lt;original locus tag prefix&gt;_RS&lt;digits&gt;. The original locus tag is provided in the “old_locus_tag” qualifier. A bacterial genomes mapping report available in the release-catalog directory (release70.bacterial-reannotation-report.txt.gz) includes information about old and new locus_tags.</p>
<h3 id="available-reports-and-documentat">Available Reports and Documentation</h3>
<p>a) Supplemental data mapping file: An FTP file in the release-catalog directory (release70.bacterial-reannotation-report.txt.gz) has been prepared for re-annotated genomes that have recently transitioned to using the new non-redundant proteins. This file reports the old protein accession and gi, the annotated CDS coordinates, the old locus_tag and NCBI GeneID values and maps them to the current non-redundant protein accession and gi, the new locus_tag and NCBI GeneID (if available), the current CDS annotation coordinates, and indicates whether the original protein identically matches or is similar to the replacement non-redundant protein, or was dropped from the annotation.
b) Supplemental report of suppressed assemblies: An FTP file in the release-catalog directory (release70.addedQA-SuppressedAssemblies.txt) reports details for a subset of bacterial genomes that were suppressed in March 2015 following an expansion of QA metrics and subsequent to curatorial review. This report illustrates some of the reasons for suppression.
c) NCBI has created online documentation to explain these changes in detail:
- Re-annotation project: http://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/reannotation/
- RefSeq Prokaryotic Genome Policy: http://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/
- RefSeq non-redundant proteins: http://www.ncbi.nlm.nih.gov/refseq/about/nonredundantproteins/
- Prokaryotic annotation pipeline: http://www.ncbi.nlm.nih.gov/genome/annotation_prok/process/
- Prokaryotic RefSeq FAQ: http://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/faq/</p>
<h3 id="impact-to-ncbi-gene">Impact to NCBI Gene</h3>
<p>Together with this re-annotation effort, the scope of bacterial genomes included in Gene has been changed to include only genomes designated as a 'reference genome,' or 'representative genome' where there is a cluster of related assemblies to indicate that the chosen representative assembly will be stable. Individual gene features on each assembly are identified with a locus_tag that can be used as a unique identifier for the gene in publications, even if the assembly is out of scope for Gene.</p>
<h3 id="ongoing-work">Ongoing work</h3>
<ul>
<li>Organism classification and QA: work continues to identify misclassified genomes and those with contamination. Depending on the specific details of identified issues, additional RefSeq bacterial genomes may be suppressed or updated.</li>
<li>Re-annotation of complete genomes: A small number of bacterial genomes have not yet been re-annotated at this time and will be in the near future. We also plan to re-annotate the archaeal RefSeq genomes in 2015.</li>
<li>Protein names: we are continuing to work on providing improved names for the non-redundant (WP_ accessioned) bacterial protein dataset. We are leveraging multiple sources of information including curated UniProtKB/Swiss-Prot records, HMMs, Domain and domain architecture, publications and manual curation.</li>
<li>Partial proteins: we are re-examining the prokaryotic genome annotation pipeline logic with regard to providing a non-redundant protein record for partial coding sequences.</li>
</ul>
<h3 id="using-this-data">Using this data</h3>
<p>Please refer to the <a href="/refseq/about/prokaryotes/faq/">RefSeq bacterial genomes FAQ</a> for information that will facilitate access to these data.</p>
<p>a) Strain-specific protein datasets for individual RefSeq genomes can be obtained online, by FTP, and through NCBI's programming utilities. To access data online, navigate to the annotated genome record(s) in NCBI's Nucleotide database, use the right-column option to "Find related data" in the Protein database, then download the protein records using the upper-right ‘Send to’ wizard. To access proteins for specific species or strains by FTP, navigate to NCBI's Assembly record then follow the right-column link to the RefSeq FTP site. RefSeq genomes include a link to the
Assembly resource in the DBLINK section of the record or in the right-column Related information section of the Nucleotide record. To access data using NCBI programming utilities one must provide the genomic accessions and use the eLink function to access the linked protein data (see documentation http://www.ncbi.nlm.nih.gov/books/NBK25501/).
b) A graphical display of an annotated gene or protein can be accessed from the Nucleotide resource. From a RefSeq genome record of interest, such as NC_002695.1, follow the link to ‘Graphics’, and search for the locus_tag or protein name of interest.
c) Conversely, if starting from an individual non-redundant protein record, information about the annotated genomic location and genome taxonomy is available by following the (page top) link to the Identical Protein report. When a non-redundant protein record has been annotated on multiple RefSeq genomes, this report page lists the set of genomes that contain that identical protein, the genomic coordinates of the annotated CDS, and the specific organism information of the annotated genomic record. Thus this report page can be used to identify the taxonomic range in which that identical protein has been found. The protein report can be downloaded in tabular format using the "Send to" link, and can be accessed using NCBI's programming utilities.</p>
<h3 id="measurable-reduction-in-protein-">Measurable reduction in protein redundancy</h3>
<p>Here are some measures for four species that illustrate the significant reduction in protein record redundancy resulting from the use of non-redundant RefSeq proteins (WP_ accessions).</p>
<pre><code>Counts:
Species Genomes Total Proteins Total Unique WPs Total Singleton WPs
------------------------- ------- -------------- ---------------- -------------------
Staphylococcus aureus 4194 11,764,898 222,588 138,284
Escherichia coli 2685 13,637,370 1,033,617 649,100
Mycobacterium tuberculosis 1790 7,245,836 139,800 101,255
Salmonella enterica 918 4,099,013 294,106 194,982
Percents:
Species Genomes Percent Reduction (WPs) Percent Singleton WPs
------------------------- ------- ----------------------- ---------------------
Staphylococcus aureus 4194 98% 62%
Escherichia coli 2685 94% 63%
Mycobacterium tuberculosis 1790 98% 72%
Salmonella enterica 918 93% 66%
Singletons Per Genome:
Species Average Protein Count Singleton WPs per Genome Percent Singleton Per Genome
------------------------- --------------------- ------------------------ ----------------------------
Staphylococcus aureus 2814 33 1.17%
Escherichia coli 5088 241 4.74%
Mycobacterium tuberculosis 4046 56 1.38%
Salmonella enterica 4485 212 4.72%
</code></pre>
<h3 id="definitions">Definitions</h3>
<ul>
<li>"Total Proteins" counts the number of times non-redundant protein accessions are annotated on the set of genomes for the species.</li>
<li>"Total Unique WPs" counts the distinct number of non-redundant proteins used across all genomes. This is the truly non-redundant set of proteins for the species. </li>
<li>"Total Singleton WPs" counts the number of non-redundant proteins used only once in the set of genomes for the species. </li>
<li>"Percent Reduction" measures the compression in protein identifier space gained by using non-redundant protein accessions (WP_ prefix).</li>
<li>"Percent Singleton WPs" measures the percent of all non-redundant proteins for that species that are used only once in that species.</li>
</ul>
<h2 id="july-13-2015-announcing-refseq-r">July 13, 2015: Announcing RefSeq Release 71</h2>
<p>This full release incorporates genomic, transcript, and protein data available, as of July 6, 2015 and includes 77,730,891 records, 52,494,032 proteins, 11,803,354 RNAs, and sequences from 55,267 organisms.</p>
<h3 id="changes-since-the-previous-relea_2">Changes since the previous release:</h3>
<p>[1] A list of updated organisms and dbSNP annotation summary is available here:</p>
<pre><code>&lt;ftp://ftp.ncbi.nih.gov/snp/release-notes/RefSeq/refseq71.snp.rpt&gt;
</code></pre>
<p>[2] Caenorhabditis elegans:</p>
<p>The Caenorhabditis elegans annotation was updated to correct an identified problem with missing gene symbols, and incorrectly labeled non-coding RNAs.</p>
<p>[3] Prokaryotic genomes:</p>
<p>We plan to comprehensively re-annotate bacterial and archaeal genomes for RefSeq release 72 (September 2015). This re-annotation is being carried out to reflect improvements in a) management of partial, very short, and fragmented genes and proteins; and b) protein name management. This re-annotation will also increase consistency of some textual information that is applied to RefSeq records. </p>
<p>Note that re-annotation will not be done for the small set of bacterial reference genomes for which annotation changes are manually maintained.</p>
<h2 id="august-27-2015-announcing-refseq">August 27, 2015: Announcing RefSeq Release 72</h2>
<p>This full release incorporates genomic, transcript, and protein data available, as of July 6, 2015 and includes 77,730,891 records, 52,494,032 proteins, 11,803,354 RNAs, and sequences from 55,267 organisms. Additional information is available in the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-notes/archive/RefSeq-release72.txt">Release Notes</a>.</p>
<h3 id="changes-since-the-previous-relea_3">Changes since the previous release:</h3>
<p><strong>[1] A list of updated organisms and dbSNP annotation summary is available here:</strong></p>
<pre><code>&lt;ftp://ftp.ncbi.nih.gov/snp/release-notes/RefSeq/refseq72.snp.rpt&gt;
</code></pre>
<p><strong>[2] Caenorhabditis elegans:</strong></p>
<p>The Caenorhabditis elegans annotation was updated to correct an identified problem with missing gene symbols, and incorrectly labeled non-coding RNAs.</p>
<p><strong>[3] Prokaryotic genomes:</strong></p>
<p>We plan to comprehensively re-annotate bacterial and archaeal genomes for RefSeq release 72 (September 2015). This re-annotation is being carried out to reflect improvements in a) management of partial, very short, and fragmented genes and proteins; and b) protein name management. This re-annotation will also increase consistency of some textual information that is applied to RefSeq records.</p>
<p>Note that re-annotation will not be done for the small set of bacterial reference genomes for which annotation changes are manually maintained.</p>
<h2 id="november-2-2015-announcing-refse">November 2, 2015: Announcing RefSeq Release 73</h2>
<p>This full release incorporates genomic, transcript, and protein data available, as of November 2, 2015 and includes 83,881,439 records, 54,766,170 proteins, 12,998,293 RNAs, and sequences from 55,966 organisms. Additional information is available in the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/release-notes/archive/RefSeq-release73.txt">Release Notes</a>.</p>
<h3 id="changes-since-the-previous-relea_4">Changes since the previous release:</h3>
<p><strong>[1] A list of updated organisms and dbSNP annotation summary is available here:</strong></p>
<pre><code>&lt;ftp://ftp.ncbi.nih.gov/snp/release-notes/RefSeq/refseq73.snp.rpt&gt;
</code></pre>
<p><strong>[2] Future change: GI sequence identifiers to be removed from some file formats</strong></p>
<p>As of 06/15/2016, the integer sequence identifiers known as "GIs" will no longer be included in the GenBank, GenPept, and FASTA formats supported by NCBI for the display of sequence records.</p>
<p>Please refer to the FTP release notes for additional details.</p>
<p><span id="shared-content-1"></span></p>
</div>
<!--/.col1-->
<div class="col2">
</div>
<!--/.col2-->
<div class="col3">
</div>
<!--/.col3-->
<div class="col4">
</div>
<!--/.col4-->
<div class="col5">
</div>
<div class="col6">
</div>
<div class="col7">
</div>
<div class="col8">
</div>
<div class="col9">
</div>
</div><!--/.content-->
</div><!--/.container-->
<div id="NCBIFooter_dynamic">
<!--<component id="NCBIBreadcrumbs"/>
<component id="NCBIHelpDesk"/>-->
<noscript><img alt="" src="/stat?jsdisabled=true&amp;ncbi_app=refseq&amp;ncbi_db=&amp;ncbi_pdid=static&amp;ncbi_phid=CE8B84157C9B19810000000000940077" /></noscript>
</div>
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" class="footer" id="footer" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg xmlns="http://www.w3.org/2000/svg" width="40" height="40" viewBox="0 0 40 40" fill="none">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008" d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z" fill="#5B616B"></path>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11" d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12" d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12" d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12" d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12" d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12" d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12" d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12" d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
<defs><style>.cls-1{fill:#737373;}</style></defs>
<title>NCBI Insights Blog</title>
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
</svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Twitter</title>
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
<path id="Vector_Twitter" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
</g>
<defs>
<clipPath id="clip0_65276_3946">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine" aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Facebook</title>
<g id="Facebook" clip-path="url(#clip0_1717_1086)">
<path id="Vector_Facebook" d="M15.1147 29.1371C15.1147 29.0822 15.1147 29.0296 15.1147 28.9747V18.9414H11.8183C11.6719 18.9414 11.6719 18.9414 11.6719 18.8018C11.6719 17.5642 11.6719 16.3289 11.6719 15.0937C11.6719 14.9793 11.7062 14.9518 11.816 14.9518C12.8683 14.9518 13.9206 14.9518 14.9751 14.9518H15.1215V14.8329C15.1215 13.8057 15.1215 12.774 15.1215 11.7492C15.1274 10.9262 15.3148 10.1146 15.6706 9.37241C16.1301 8.38271 16.9475 7.60378 17.9582 7.19235C18.6492 6.90525 19.3923 6.76428 20.1405 6.7783C21.0029 6.79202 21.8653 6.83091 22.7278 6.86065C22.8879 6.86065 23.048 6.89496 23.2082 6.90182C23.2974 6.90182 23.3271 6.94071 23.3271 7.02993C23.3271 7.54235 23.3271 8.05477 23.3271 8.5649C23.3271 9.16882 23.3271 9.77274 23.3271 10.3767C23.3271 10.4819 23.2974 10.5139 23.1921 10.5116C22.5379 10.5116 21.8814 10.5116 21.2271 10.5116C20.9287 10.5184 20.6316 10.5528 20.3395 10.6146C20.0822 10.6619 19.8463 10.7891 19.6653 10.9779C19.4842 11.1668 19.3672 11.4078 19.3307 11.6669C19.2857 11.893 19.2612 12.1226 19.2575 12.3531C19.2575 13.1904 19.2575 14.0299 19.2575 14.8695C19.2575 14.8946 19.2575 14.9198 19.2575 14.9564H23.0229C23.1807 14.9564 23.183 14.9564 23.1624 15.1074C23.0778 15.7662 22.9885 16.425 22.9039 17.0816C22.8322 17.6321 22.7636 18.1827 22.698 18.7332C22.6729 18.9437 22.6797 18.9437 22.4693 18.9437H19.2644V28.8992C19.2644 28.9793 19.2644 29.0593 19.2644 29.1394L15.1147 29.1371Z" fill="white"></path>
<path id="Vector_2_Facebook" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1086">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="Youtube" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Youtube</title>
<g id="YouTube" clip-path="url(#clip0_1717_1101)">
<path id="Vector_Youtube" d="M26.2571 11.4791C25.9025 11.1589 25.5709 10.9576 24.228 10.834C22.5512 10.6785 20.2797 10.6556 18.564 10.6533H16.4365C14.7208 10.6533 12.4493 10.6785 10.7725 10.834C9.43196 10.9576 9.09798 11.1589 8.7434 11.4791C7.81464 12.321 7.6202 14.6268 7.59961 16.8938C7.59961 17.3178 7.59961 17.741 7.59961 18.1635C7.62706 20.4121 7.82837 22.686 8.7434 23.521C9.09798 23.8412 9.42967 24.0425 10.7725 24.1661C12.4493 24.3216 14.7208 24.3445 16.4365 24.3468H18.564C20.2797 24.3468 22.5512 24.3216 24.228 24.1661C25.5686 24.0425 25.9025 23.8412 26.2571 23.521C27.1722 22.6929 27.3735 20.451 27.4009 18.2206C27.4009 17.7402 27.4009 17.2599 27.4009 16.7795C27.3735 14.5491 27.1699 12.3072 26.2571 11.4791ZM15.5604 20.5311V14.652L20.561 17.5001L15.5604 20.5311Z" fill="white"></path>
<path id="Vector_2_Youtube" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1101">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br />
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br />
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white">FOIA</a><br />
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br />
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<nav class="bottom-links">
<ul class="mt-3">
<li>
<a class="text-white" href="//www.nlm.nih.gov/">NLM</a>
</li>
<li>
<a class="text-white" href="https://www.nih.gov/">NIH</a>
</li>
<li>
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
</li>
<li>
<a class="text-white" href="https://www.usa.gov/">USA.gov</a>
</li>
</ul>
</nav>
</div>
</div>
</div>
</section>
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
</div>
</div>
<!--/.footer-->
<p class="last-updated small">Last updated: 2017-12-01T21:32:03Z</p>
</div>
<!--/.page-->
</div>
<!--/.wrap-->
<span class="PAFAppResources"></span>
</div><!-- /.twelve_col -->
</div>
<!-- /.grid -->
<!-- usually for JS scripts at page bottom -->
<span class="pagefixtures"></span>
<!-- CE8B5AF87C7FFCB1_0191SID /projects/refseq/refseq@1.21 portal104 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
<script type='text/javascript' src='/portal/js/portal.js'></script><script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4218658/js/3879255/4121861/4218656/4087685.js" snapshot="refseq"></script></body>
</html>