nih-gov/www.ncbi.nlm.nih.gov/genbank/wgsfaq/index.html

993 lines
58 KiB
HTML

<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<!-- AppResources meta begin -->
<meta name="paf-app-resources" content="" />
<!-- AppResources meta end -->
<!-- TemplateResources meta begin -->
<meta name="paf_template" content="StdNCol" />
<!-- TemplateResources meta end -->
<!-- Page meta begin -->
<!-- Page meta end -->
<!-- Logger begin -->
<meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_app" content="genbank" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_pdid" content="custom-page" />
<!-- Logger end -->
<title>Frequently Asked Questions for Genomes</title>
<!-- PageFixtures headcontent begin -->
<meta name="cms-local-nav-url" content="https://cms.ncbi.nlm.nih.gov//genbank/_nav" />
<!-- PageFixtures headcontent end -->
<!-- AppResources external_resources begin -->
<script type="text/javascript" src="/core/jig/1.15.6/js/jig.min.js"></script>
<!-- AppResources external_resources end -->
<!-- Page headcontent begin -->
<meta name="subsite" content="genbank" />
<meta name="path" content="genbank/wgsfaq" />
<meta name="modified" content="2024-03-22T15:36:55Z" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="cms-edit-aux-url" content="http://cms.ncbi.nlm.nih.gov/node//edit" />
<!-- Page headcontent end -->
<!-- PageFixtures resources begin -->
<link xmlns="http://www.w3.org/1999/xhtml" type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218191/css/4207974/4206132.css" xml:base="http://127.0.0.1/sites/static/header_footer" />
<!-- PageFixtures resources end -->
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8EA1107C7F390100000000013300F0.m_6" />
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/css/4121862/3974050/3917732/251717/4108189/14534/45193/3534283/4128070/3407145/4005757/4062871.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/css/3529741/3529739.css" media="print" /></head>
<body class=" col2 custom-page">
<div class="grid">
<div class="col twelve_col nomargin shadow">
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
<div class="sysmessages">
<noscript>
<p class="nojs">
<strong>Warning:</strong>
The NCBI web site requires JavaScript to function.
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
</p>
</noscript>
</div>
<!--/.sysmessage-->
<div class="wrap">
<div class="page">
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" id="universal_header" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
<div class="usa-banner-guidance-gov usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
<span class="fa fa-user" aria-hidden="true">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
<g style="fill: #fff">
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
</g>
</svg>
</span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
<span class="fa fa-times">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
</svg>
</span>
<span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br />
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
</div>
</div>
<!--/.header-->
<div class="header">
<div class="res_logo"><h1 class="res_name"><a href="/genbank/" title="GenBank home">GenBank</a></h1><h2 class="res_tagline">Public nucleic acid sequence repository</h2></div>
<div class="search"><form method="get" action="/nuccore/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="nuccore" selected="selected">Nucleotide</option><option value="sra">SRA</option><option value="books">Books</option><option value="clinvar" class="last">ClinVar</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label 
for="term" class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search Nucleotide" value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="isEnabled:false,disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'yes'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div></form></div>
</div>
<div class="nav_and_browser">
<div class="localnav"><ul class="jig-ncbilocalnav">
<li><a href="#">GenBank</a><ul>
<li><a href="/genbank/">About GenBank</a></li>
<li><a href="/genbank/submit_types">Submission Types</a></li>
<li><a href="/genbank/submit">Submission Tools</a></li>
<li><a href="/genbank/update">Update GenBank Records</a></li>
<li><a href="/nuccore/">Search</a></li>
<li><a href="/BLAST/Blast.cgi?CMD=Web&amp;PAGETYPE=BLASTHome">BLAST</a></li>
<li><a href="/genbank/statistics">Statistics</a></li>
<li><a href="/genbank/samplerecord/">Sample Record</a></li>
<li><a href="/genbank/sequencerevisionhistory/">Revision History</a></li>
<li><a href="/genbank/sequenceids/">Sequence IDs</a></li>
</ul>
</li>
<li><a href="#">Submit</a><ul>
<li><a href="/genbank/submit">Submission Tools</a></li>
<li><a href="/genbank/submit_types">Submission Types</a></li>
<li><a href="/WebSub/?tool=genbank">BankIt</a></li>
<li><a href="/genbank/table2asn">table2asn</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/sra/docs/sequence-data-processing">Sequence Data Processing</a></li>
</ul>
</li>
<li><a href="#">Genomes</a><ul>
<li><a href="/genbank/genomesubmit">Complete Genome Submission Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation">Prokaryotic Genome Annotation Guide</a></li>
<li><a href="/genbank/eukaryotic_genome_submission_annotation">Eukaryotic Genome Annotation Guide</a></li>
<li><a href="/genbank/examples.wgs">Annotation Examples</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/wgs/">Genome Submission Portal</a></li>
</ul>
</li>
<li><a title="Whole Genome Shotgun sequences and submissions" href="#">WGS</a><ul>
<li><a href="/genbank/wgs">About WGS</a></li>
<li><a href="/Traces/wgs">WGS Project List</a></li>
<li><a href="/genbank/wgs.submit">WGS Submission Guide</a></li>
<li><a href="/genbank/wgsfaq/">FAQ</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/wgs/">Genome Submission Portal</a></li>
<li><a href="/genbank/eukaryotic_genome_submission_annotation">Eukaryotic Annotation Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation">Prokaryotic Annotation Guide</a></li>
<li><a href="/genbank/asndisc">Discrepancy Report</a></li>
<li><a href="/assembly/agp/AGP_Specification/">AGP format</a></li>
</ul>
</li>
<li><a href="#">Metagenomes</a><ul>
<li><a href="/genbank/metagenome">About Metagenomes</a></li>
<li><a href="/genbank/structuredcomment">Structured Comment</a></li>
</ul>
</li>
<li><a href="#">TPA</a><ul>
<li><a href="/genbank/TPA">About TPA</a></li>
<li><a href="/genbank/tpafaq">FAQ</a></li>
<li><a href="/genbank/TPA-Exp">TPA-Exp</a></li>
<li><a href="/genbank/TPA-Inf">TPA-Inf</a></li>
</ul>
</li>
<li><a href="#">TSA</a><ul>
<li><a href="/genbank/TSA">About TSA</a></li>
<li><a href="/genbank/TSAguide">TSA Submission Guide</a></li>
<li><a href="/genbank/TSAfaq">FAQ</a></li>
</ul>
</li>
<li><a href="#">INSDC</a><ul>
<li><a href="/genbank/collab">About INSDC</a></li>
<li><a href="/genbank/collab/country">Geographic Location Name List</a></li>
<li><a href="/genbank/collab/db_xref">db_xref List</a></li>
<li><a href="http://www.insdc.org/documents/feature_table.html">Feature Table</a></li>
</ul>
</li>
<li><a href="#">Documentation</a><ul>
<li><a href="https://www.ncbi.nlm.nih.gov/sra/docs/sequence-data-processing/">Sequence Data Processing</a></li>
<li><a href="/genbank/submission_brokers">Submission Brokers</a></li>
<li><a href="/genbank/acc_prefix">Accession Number Prefixes</a></li>
<li><a href="/genbank/organelle_submit/">Organelle Submission Guide</a></li>
<li><a href="/genbank/monkeypox_submission/">Monkeypox Submission Guide</a></li>
<li><a href="/genbank/validation/">Common Submission Errors</a> </li>
<li><a href="/genbank/sequencecheck/">Ribosomal Submission Errors</a></li>
<li><a href="/genbank/sequencecheck/virus">Common Sequence Errors</a></li>
<li><a href="https://support.nlm.nih.gov/knowledgebase/category/?id=CAT-01240">Submission FAQs</a></li>
</ul>
</li>
<li><a href="#">Other</a><ul>
<li><a href="/genbank/htgs">About HTGs</a></li>
<li><a href="/genbank/dbest">About EST</a></li>
<li><a href="/genbank/dbgss">About GSS</a></li>
<li><a href="/genbank/tls">About TLS</a></li>
<li><a href="/genbank/tlsguide">Submit TLS</a></li>
</ul>
</li>
</ul></div>
</div>
<!-- was itemctrl -->
<div class="container">
<div id="maincontent" class="content col twelve_col last">
<div class="col1">
<h1 id="frequently-asked-questions-for-g">Frequently Asked Questions for Genomes</h1>
<ol>
<li><a href="#q1">Can I submit an assembly and have it held back until I publish my paper?</a></li>
<li><a href="#virus">Where do I submit my viral genome assemblies?</a></li>
<li><a href="#multi">Do I have to register a separate BioProject for each genome I am sequencing?</a></li>
<li><a href="#q3">Do I need to submit my genome assembly with annotation?</a></li>
<li><a href="#pipe">Does NCBI have an annotation pipeline that can be used to annotate my assembly?</a></li>
<li><a href="#annot_format">If I do have my own annotation, in what format should I provide this data?</a></li>
<li><a href="#ff">Can I submit annotation as a GenBank flatfile?</a></li>
<li><a href="#ngs">I'm using next generation sequencing technology. Can I still submit an assembly?</a></li>
<li><a href="#split">Do I need to split the sequences at the Ns that were inserted by the assembler?</a></li>
<li><a href="#q6">What should I use for the gap sizes?</a></li>
<li><a href="#q7">I concatenated the sequences into the correct order with Ns between each sequence and annotated this pseudomolecule. Can I submit this annotated pseudomolecule?</a></li>
<li><a href="#q8">I concatenated the sequences in a random order with Ns between each sequence and annotated the pseudomolecule. Can I submit the annotated pseudomolecule?</a></li>
<li><a href="#q9">Can I annotate across gaps?</a></li>
<li><a href="#q13">My genome assembly has contigs and scaffolds. Should I submit the annotation on the contigs or the scaffolds?</a></li>
<li><a href="#singletons">I want all of the WGS contigs in my assembly available to users. Should I put unlinked WGS contigs into the AGP?</a></li>
<li><a href="#diploid">How do I submit the separate haplotypes that were created from the reads of a diploid/polyploid genome?</a></li>
<li><a href="#metagen">How do I submit a prokaryotic or eukaryotic genome assembled from metagenomic reads (a MAG)?</a></li>
<li><a href="#rast">Can I submit RAST annotation?</a></li>
</ol>
<h2 id="q1">Can I submit an assembly and have it held back until I publish my paper?</h2>
<p>Yes, you may submit your assembly and have it held until publication. You will select a release date, and your genome will be released on that day or when it is publicly available, whichever is first. If needed, you can write to <a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a> to request a change of the release date.</p>
<p>Note that release of the genome will automatically trigger the release of its BioProject and BioSample. However, the reverse is not true; the release of a BioProject or BioSample will not automatically trigger the release of associated data.</p>
<h2 id="virus">Where do I submit my viral genome assemblies?</h2>
<p>Virus sequences are submitted to GenBank via the appropriate option on the <a href="https://www.ncbi.nlm.nih.gov/WebSub/">BankIt</a> page.</p>
<h2 id="multi">Do I have to register a separate BioProject for each genome I am sequencing?</h2>
<p>If multiple genomes are part of the same research effort,
then they should belong to the same BioProject. However, each sample
must be registered as a separate BioSample.</p>
<p>Be sure to use the same BioProject and BioSample for the assembled genome and for the sequence reads that were used to assemble it.</p>
<h2 id="q3">Do I need to submit my genome assembly with annotation?</h2>
<p>No, you can submit the genome without any annotation. However, during the
genome submission you may request that a prokaryotic genome assembly be annotated by NCBI's
<a href="#pipe">Prokaryotic Genome Annotation Pipeline</a> before its release into
GenBank.</p>
<h2 id="pipe">Does NCBI have an annotation pipeline that can be used to annotate my assembly?</h2>
<p>You can request that NCBI annotate prokaryotic genomes using our <a href="/genome/annotation_prok/">Prokaryotic Genome Annotation Pipeline</a> during the <a href="/genbank/genomesubmit/#pgap">submission process</a>. </p>
<p>In addition, you can download and <a href="/genbank/genomesubmit/#run_pgap">run PGAP yourself</a> before submission, if desired.</p>
<p>The NCBI <a href="/genome/annotation_euk/">Eukaryotic Genome Annotation pipeline</a> is not available as a
GenBank submitter resource. See its <a href="/genome/annotation_euk/policy/">annotation policy</a> for details.</p>
<h2 id="annot_format">If I do have my own annotation, in what format should I provide this data?</h2>
<p>To submit the annotation, you need to create a .sqn file in ASN format
that combines the annotation and sequence, allowing for validation to check that these are consistent with each other without errors. The basic description is at <a href="https://www.ncbi.nlm.nih.gov/genbank/genomesubmit/#sqn">https://www.ncbi.nlm.nih.gov/genbank/genomesubmit/#sqn</a>.</p>
<p>As described there, the annotation input can be in either the 5-column
feature table (.tbl) format OR as a GenBank-specific GFF3 file. You then run table2asn to create the .sqn file and validate it.</p>
<ul>
<li><a href="/genbank/genomesubmit_annotation">Prokaryotic Annotation Guidelines</a> with .tbl examples</li>
<li><a href="/genbank/eukaryotic_genome_submission">Eukaryotic Annotation Guidelines</a> with .tbl examples</li>
<li><a href="/genbank/genomes_gff">Using GFF3 file as input</a></li>
</ul>
<p>Note that our set of <a href="#rast">RAST conversion scripts</a> is able to convert some .gb
flatfile formats into a GenBank submission.</p>
<h2 id="ff">Can I submit annotation as a GenBank flatfile?</h2>
<p>In general, we cannot accept annotation as a GenBank, EMBL or DDBJ flat
file. To submit annotation, see this <a href="#annot_format">FAQ</a>.</p>
<p>However, you might be able to use the <a href="#rast">RAST conversion scripts</a> to make the correct file for
submission from a .gb file, although there may still be problems that
need to be fixed to create a GenBank submission.</p>
<h2 id="ngs">I'm using next generation sequencing technology. Can I still submit an assembly?</h2>
<p>Yes, you may submit assemblies using second or third generation sequencing
technology. The primary reads should be submitted to the <a href="/sra">Sequence Read Archive</a>.
The reads should be assembled into contigs
and submitted as described in the <a href="/genbank/genomesubmit">submission instructions</a>.
These WGS contigs can be used to
assemble higher order molecules and submitted to GenBank genomes either as gapped scaffold sequences or
as contigs plus an AGP file, as described in the <a href="/genbank/genomesubmit">submission instructions</a>.</p>
<h2 id="split">Do I need to split the sequences at the Ns that were inserted by the assembler?</h2>
<p>No, you do not need to split properly assembled sequences. However, sequences that have been concatenated in random, unknown order are not allowed. For example, we cannot accept a single sequence of all the unplaced sequences (eg, a chromosome Un).</p>
<p>During the submission process you will be asked to indicate what the Ns in the
genome sequence represent. The default answers are that 10 or more Ns
in a row represent a gap and that "paired-ends" is the evidence that
the sequences on either side of each gap are linked. If those answers
are not correct, then you need to provide the correct answers in the
submission form. During processing of the submission, those runs of Ns will be converted
to assembly_gap features. Note that NCBI's <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly resource</a> counts
runs of 10 or more Ns as a gap, regardless of whether they have been
converted to a gap during processing of the genome.</p>
<p>The original/traditional submission format, of splitting the sequences at the runs
of Ns into contigs and rebuilding the scaffolds with an AGP file,
remains a submission option.</p>
<h2 id="q6">What should I use for the gap sizes?</h2>
<p>If you have estimates of the gap sizes, then use those values for the
gaps in the AGP file. We prefer that you use 10 as the minimum gap size, to be more of
a signal to database users. If you do not have an estimate of the gap
size, then the preference is to use 100 as the value and the 'U' in
column five of the <a href="/assembly/agp/AGP_Specification/">AGP</a> file,
indicating that the gap size is unknown. </p>
<p>If there is no annotation, then you can submit the fasta file and
answer the questions about the Ns in the sequence. The default answers
are that 10 or more Ns in a row represent a gap and that "paired-ends"
is the evidence that the sequences on either side of each gap are
linked. If those answers are not correct, then you provide the
correct answers in the submission form. During processing those runs
of Ns will be converted to assembly_gap features. Note that NCBI's
<a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly resource</a> counts runs of 10 or more Ns as a gap, regardless of
whether they have been converted to a gap during processing of the
genome.</p>
<p>For more complicated submissions with annotation on gapped sequence, follow the <a href="/genbank/wgs_gapped">Gapped submission</a> cases and instructions.</p>
<h2 id="q7">I concatenated the sequences into the correct order with the Ns between each sequence and annotated the pseudomolecule. Can I submit this annotated pseudomolecule?</h2>
<p>Yes, you can submit this gapped submission. However, you will need
to include the correct gap and linkage evidence for each run of Ns
that represents a gap. You can make the appropriate gaps with table2asn, as
<a href="/genbank/wgs_gapped">described</a>, and use <a href="/genbank/genomesubmit/#sqn">.tbl</a> or <a href="/genbank/genomes_gff">GenBank-specific .gff file</a> as the annotation input.</p>
<h2 id="q8">I concatenated the sequences in a random order with Ns between each sequence and annotated this pseudomolecule. Can I submit the annotated pseudomolecule?</h2>
<p>No, you cannot. Since the sequence does not correspond to a biological
molecule, you need to split the pseudomolecule into the contig
sequences and submit those as the pieces of a wgs project. You will
need to map the annotation down to the contig level, but can use an
<a href="/genbank/feature_table">offset in the .tbl file</a> to avoid recalculating locations, if desired.</p>
<h2 id="q9">Can I annotate across gaps?</h2>
<p>Protein translations are allowed to cross gaps of estimated size, but
not those of unknown sizes. That is, introns can be in gaps of unknown
size, but not exons. However, annotation across gaps is discouraged
unless there is evidence that the translation on the other side of the
gap is in the correct frame. In addition, if &gt;50% of the
translation is Xs (i.e. in the gap) then the CDS should be made
partial at the gap, or split into two partial CDSs, as described for
<a href="/genbank/eukaryotic_genome_submission_annotation/#Splitgenesontwocontigs">genes split across two contigs</a>,
depending upon the confidence of the translation on both sides of the
gap.</p>
<h2 id="q13">My genome assembly has contigs and scaffolds. Should I submit the annotation on the contigs or the scaffolds?</h2>
<p>Eukaryotic genomes, which usually have thousands of contigs and
hundreds or thousands of scaffolds, should be annotated at the
scaffold level. </p>
<h2 id="singletons">I want all of the WGS contigs in my assembly available to users. Should I put singleton WGS contigs into the AGP?</h2>
<p>When a genome submission includes an AGP file, that file defines the assembly. Therefore, typically we do want all of the WGS contigs in the AGP file. However, contigs that are not considered to be part of the assembly, perhaps because they are degenerate or duplicates, should not be included in the AGP file. In addition, remove from the submission any sequences that are shorter than 200 bp and are not part of multi-component scaffolds.</p>
<h2 id="diploid">How do I submit the separate haplotypes that were created from the reads of a diploid/polyploid genome?</h2>
<p>When the assembly methods were able to generate separate assemblies of the haplotypes of a diploid/polyploid genome, submit them according to the instructions at <a href="/genbank/diploid_haps/">Submitting multiple haplotype assemblies</a>.</p>
<h2 id="metagen">How do I submit a prokaryotic or eukaryotic genome assembled from metagenomic reads (a MAG)?</h2>
<p>Description: You isolated DNA from an environmental or mixed sample and then binned and assembled the sequences to create individual prokaryotic or eukaryotic metagenome-assembled genomes (MAGs). Each assembly must:</p>
<ul>
<li>represent the genome from a single prokaryotic or eukaryotic organism reconstructed from the metagenomic mix</li>
<li>include all the identified genome sequence (ie, you have not intentionally removed noncoding regions or included only the sequences for a single kind of gene)</li>
<li>have a CheckM or CheckM2 completeness of at least 90%</li>
<li>have a total size of at least 100,000 nucleotides</li>
</ul>
<p>Note that you should only use sequences that you have determined
yourself. Do not include sequences you have only downloaded from a
public depository. The raw reads should be submitted to the
<a href="https://submit.ncbi.nlm.nih.gov/subs/sra/">Sequence Read Archive (SRA)</a> and the
contigs made from overlapping reads can be submitted as a genome assembly.</p>
<p>(1) You will need to <a href="https://submit.ncbi.nlm.nih.gov/subs/bioproject">register a BioProject</a> for this
research effort. You can use this one BioProject for all the data associated with this study.</p>
<p>(2) You will need the SRA run accessions for the reads used to create the MAGs.
SRA data is organized into 4 levels:</p>
<ul>
<li>STUDY: accessions begin with SRP,ERP,DRP</li>
<li>SAMPLE: accessions begin with SRS,ERS,DRS</li>
<li>EXPERIMENT: accessions begin with SRX,ERX,DRX</li>
<li>RUN: accessions begin with SRR,ERR,DRR</li>
</ul>
<p>Please provide the 'run' accessions for the individual reads that
were used for each MAG. The accessions should start with SRR, ERR, or DRR.
You will need the SRA accessions when you create the MAG BioSamples in step (5).</p>
<p>Alternatively, if you sequenced the data but did not submit the reads to SRA,
instead of providing the SRA accessions, you can use a BioSample that represents
the mixed sample from which the DNA was isolated. Register this physical sample
in the <a href="https://submit.ncbi.nlm.nih.gov/subs/biosample/">BioSample database</a>. Select either the NCBI "Metagenome or environmental" package or the GSC MIxS
"MIMS Environmental/Metagenome" package. Use a metagenome organism name
that describes the sample from which the DNA was isolated (eg soil metagenome or
gut metagenome). Choose one of the metagenome names that is already present in the
<a href="https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Undef&amp;id=408169&amp;lvl=3&amp;p=mapview&amp;p=has_linkout&amp;p=blast_url&amp;p=genome_blast&amp;keep=1&amp;srchmode=1&amp;unlock">NCBI Taxonomy database</a>.
If you did not submit the reads to SRA, you will need this physical metagenome
BioSample when you create the MAG BioSamples in step (5).</p>
<p>(3) Please provide a unique alpha-numeric code to distinguish each MAG assembly.
We will add the identifier as an isolate but we realize each organism was metagenomically
binned and not isolated. The isolate will be a stable identifier used only for a single MAG
that will not change over time. We do not recommend including the organism name or an
abbreviation of the organism name in the isolate, because the organism name may be updated
if additional work is done to characterize the MAG in the future, but the isolate will not change.
Do not include SRA accessions as part of the isolate. The isolate should be a series of letters or
numbers that serve as an identifier for your organism assembly. For example, how do you identify
this assembly in your laboratory notebook? If you don't have another identifier, you could use
something like MAG1, MAG2. You will need the isolate when you register the MAG BioSample
in step (5).</p>
<p>(4) We will need an organism name for each MAG. The organism names should be taxonomically meaningful,
at the lowest rank that is reliable (division, phylum, class, order, family, genus or species)
and in the NCBI Taxonomy database. Note that NCBI does not utilize unpublished ad hoc taxonomic names
from other databases such as Silva or GTDB. Therefore, before registering the BioSamples,
please email to <a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a> a list of organism names
you plan to use and we will verify that those names are in the NCBI taxonomy database or are
appropriate to be added to the database. Please provide a table with:</p>
<ul>
<li>Column 1: the unique isolate name from step (3)</li>
<li>Column 2: the organism names you would like to use OR the GTDB lineage in the original unmodified format</li>
</ul>
<p>We can use the unmodified GTDB lineage to determine the best NCBI tax name, but our tool will
not work if the format from GTDB has been modified. Here is an example of the correct format:</p>
<table>
<thead>
<tr>
<th>Isolate</th>
<th>GTDB lineage</th>
</tr>
</thead>
<tbody>
<tr>
<td>MAG1</td>
<td>d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_D</td>
</tr>
<tr>
<td>MAG2</td>
<td>d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Monoglobales_A;f__UBA1381;g__12844;s__</td>
</tr>
<tr>
<td>MAG3</td>
<td>d__Bacteria;p__Myxococcota;c__Polyangia;o__Haliangiales;f__Haliangiaceae;g__;s__</td>
</tr>
<tr>
<td>MAG4</td>
<td>d__Bacteria;p__Patescibacteria;c__ABY1;o__SG8-24;f__2-12-FULL-60-25;g__;s__</td>
</tr>
</tbody>
</table>
<p>We will confer with the NCBI taxonomists and return to you the organism names to use when you create the MAG BioSamples in step (5).</p>
<p>(5) Use the names that we return to you in step (4) to <a href="https://submit.ncbi.nlm.nih.gov/subs/biosample/">create organism-specific MAG BioSamples</a>. You should create one BioSample
for each MAG. When you create the MAG BioSamples:</p>
<ul>
<li>choose the “MIMAG Metagenome-assembled Genome” package</li>
<li>include the BioProject ID PRJNAxxxx you created in step (1)</li>
<li>include as much source information as you can (e.g., geo_loc_name, collection-date, lat-lon, isolation-source, etc.). The information should agree with the corresponding SRA data or physical BioSample(s). If multiple samples were used, include the common information. For example, if samples were collected on 3 different dates in the same year, just use the year as the collection-date of the MAG.</li>
<li>include a unique isolate name from step (3)</li>
<li>include sample_type=metagenomic assembly</li>
<li>in the derived_from attribute, list the SRA accessions for the reads used to create the MAGs (see step (2)). If there is more
than one read accession for a MAG, list all the accessions separated by commas. Do not hyphenate the list. Alternatively, if you did
not submit the reads or if your protocol precluded knowing which reads were used to assemble the MAG, you can provide the SAMN id for
the physical BioSample(s) that represents the mixed sample from which the DNA was isolated as described in step (2). </li>
</ul>
<p>If you have several MAG BioSamples, you can use a table to upload all the BioSample information. From the
<a href="https://submit.ncbi.nlm.nih.gov/subs/biosample/">BioSample registration page</a> select
"Download batch template". Choose the “MIMAG Metagenome-assembled Genome” package and select
"download". Fill in this template and then upload it using the "Batch/Multiple BioSamples" option when you create a new BioSample
submission. Alternatively, you can provide this information in the embedded table within the BioSample submission form.
Note that you can only create 1000 BioSamples in a single table. If you have more than 1000 MAGs, you will need to divide the table
into separate BioSample submissions. If you are planning to submit 5000 or more MAGs, please write to <a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a>
so we can review your BioSamples before you begin submitting the genome files.</p>
<p>(6) Prepare the genome sequences. In the fasta header of each sequence, include the SRA read accessions (SRR,ERR,DRR) of the reads
that were used to assemble the MAG (see step (2)). For example:</p>
<p>&gt;contig1 [SRA=SRRxxxxxx,SRRxxxxxy]</p>
<p>(7) After you have created the BioProject and the BioSamples, you are ready to submit the data using the <a href="https://submit.ncbi.nlm.nih.gov/subs/genome/">genome submission portal</a>.<br />
Submit each MAG assembly as a separate row in a <a href="/genbank/genomesubmit/#batch">batch submission</a> using the BioProject ID PRJNAxxxxx
from step (1) and the BioSample ID SAMNxxxxxxxx for the individual MAG from step (5). Note that because we run several validation
checks on each genome assembly, a single batch submission cannot contain more than 400 assemblies. If you have more than 400 MAGs,
you will need to divide them into separate batches. </p>
<p>(8) Annotation is not required; however, you may be interested to know that NCBI has a publicly available <a href="https://www.ncbi.nlm.nih.gov/genome/annotation_prok/">Prokaryotic Genomes Annotation Pipeline (PGAP)</a>. PGAP can be used for prokaryotic MAGs but not for sequences that are identified only as metagenomes. You can <a href="https://www.ncbi.nlm.nih.gov/genbank/genomesubmit/#pgap">request PGAP annotation during submission</a> of the MAG to GenBank, or you can <a href="https://www.ncbi.nlm.nih.gov/genbank/genomesubmit/#run_pgap">run PGAP yourself</a> and submit a GenBank-ready file. Note that we do not have a publicly available eukaryotic annotation pipeline.</p>
<h2 id="rast">Can I submit RAST annotation?</h2>
<p>We have a prototype that will convert flatfile
formats created by outside programs for prokaryotes into a 5-column feature
table. However, there may still be problems because GenBank-type files from other
sources often contain qualifiers that are not recognized by GenBank so
they cannot be converted. Conversely, features or qualifiers that are
required by GenBank may be missing. In addition, there may be errors
such as internal N's representing gaps, invalid translations or
<a href="/genbank/genomesubmit_annotation/#CDS">unacceptable protein names</a> that need to be addressed.</p>
<p>To convert the flatfile (.gb) file from RAST to a .sqn file for GenBank
submission, get the scripts from the scripts directory on the NCBI ftp
site: <a href="https://ftp.ncbi.nih.gov/toolbox/ncbi_tools/converters/scripts/">https://ftp.ncbi.nih.gov/toolbox/ncbi_tools/converters/scripts/</a></p>
<ul>
<li>gbf2tbl.pl</li>
<li>rast2sqn.sh</li>
<li>rastbatch.sh</li>
<li>tblfix.pl</li>
</ul>
<p>In addition, provide the following:</p>
<ul>
<li>a template file (from <a href="https://submit.ncbi.nlm.nih.gov/genbank/template/submission/">https://submit.ncbi.nlm.nih.gov/genbank/template/submission/</a>)</li>
<li>flatfile from RAST (*.gb)</li>
<li>locus tag prefix (whatever is registered in BioProject for this genome)</li>
<li>protein_id prefix (an abbreviation of your lab name that you think will be unique)</li>
</ul>
<p>usage:</p>
<ul>
<li><code>./rast2sqn.sh template flatfile locus_tag_prefix protein_id_prefix</code></li>
</ul>
<p>for example:</p>
<p>input:</p>
<ul>
<li>flatfile = TEST.gb</li>
<li>template file = template.sbt</li>
<li>locus_tag prefix = AAA</li>
<li>protein_id_prefix = xx</li>
</ul>
<p>commandline:</p>
<ul>
<li>./rast2sqn.sh template.sbt TEST.gb AAA xx</li>
</ul>
<p>output:</p>
<ul>
<li>TEST.sqn</li>
<li>TEST.fsa</li>
<li>TEST.tbl</li>
<li>TEST.val = validation</li>
<li>errorsummary.val = summary of validation</li>
<li>TEST.dsc = discrepancy report</li>
<li>TEST.err = qualifiers that couldn't be converted</li>
<li>TEST.ecn = EC_numbers that are not found at ftp://ftp.expasy.org/databases/enzyme/enzyme.dat</li>
<li>TEST.fixedproducts = product names found by the discrepancy report Typo, Hypothetical protein, and American spelling tests that are automatically corrected</li>
</ul>
<p>You will need to review the validation and discrepancy reports, as described in the <a href="/genbank/genomesubmit/#sqn">3) Check the output of the validation and discrepancy report and fix problems</a> section under the '<em>see details</em>' hyperlink.</p>
<p>Make any necessary corrections to the starting .gb file and re-run the script. Alternatively, you can edit the .tbl file and then run table2asn <a href="/genbank/genomesubmit/#sqn">as described</a> to create a .sqn file for submission.</p>
<p><a href="https://submit.ncbi.nlm.nih.gov/subs/genome/">Submit</a> the .sqn file, as described.</p>
</div>
<!--/.col1-->
<div class="col2">
<div class="rightnav">
<h2 id="genome-resources">Genome Resources</h2>
<ul>
<li><a href="/genbank/wgs/">About WGS</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/Traces/wgs/?view=wgs">WGS Browser</a></li>
<li><a href="/genbank/genomesubmit/">Genome Submission Guide</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/genome/">Genome Submission Portal</a></li>
<li><a href="/genbank/wgs_update/">Update Genome Records</a></li>
<li><a href="/genbank/wgsfaq/">FAQ</a></li>
<li><a href="/genbank/table2asn">table2asn</a></li>
<li><a href="/genbank/diploid_haps">Submitting Multiple Haplotype Assemblies</a></li>
<li><a href="/WebSub/template.cgi/">Create Submission Template</a></li>
<li><a href="/genbank/eukaryotic_genome_submission/">Eukaryotic Annotation Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation/">Prokaryotic Annotation Guide</a></li>
<li><a href="/genbank/examples.wgs/">Annotation Example Files</a></li>
<li><a href="/genbank/genomes_gff">Annotating Genomes with GFF3 or GTF files</a></li>
<li><a href="/genbank/genome_validation">Validation Error Explanations for Genomes</a></li>
<li><a href="/genbank/asndisc/">Discrepancy Report</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/genome/annotation_prok/">NCBI Prokaryotic Genome Annotation Pipeline</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/assembly/agp/AGP_Specification/">AGP Format</a></li>
<li><a href="/genbank/metagenome/">Metagenome Submission Guide</a></li>
<li><a href="/genbank/structuredcomment/">Structured Comment</a></li>
<li><a href="/bioproject/">BioProject</a></li>
<li><a href="/biosample/">BioSample</a></li>
</ul>
</div>
</div>
<!--/.col2-->
<div class="col3">
</div>
<!--/.col3-->
<div class="col4">
</div>
<!--/.col4-->
<div class="col5">
</div>
<div class="col6">
</div>
<div class="col7">
</div>
<div class="col8">
</div>
<div class="col9">
</div>
</div><!--/.content-->
</div><!--/.container-->
<div id="NCBIFooter_dynamic">
<div class="breadcrumbs">You are here:
<span id="breadcrumb_text"><a href="/guide/">NCBI</a></span></div>
<a id="help-desk-link" class="help_desk" href="https://support.ncbi.nlm.nih.gov/ics/support/default.asp?Time=2025-03-05T02:45:40-05:00&amp;Snapshot=%2Fprojects%2Fstaticsites%2Fgenbank%2Fgenbank@2.21&amp;Host=portal107&amp;ncbi_phid=CE8EA1107C7F390100000000013300F0&amp;ncbi_session=CE8B5AF87C7FFCB1_0191SID&amp;from=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fgenbank%2Fwgsfaq%2F&amp;Ncbi_App=genbank&amp;Page=custom-page&amp;style=classic&amp;deptID=28049" target="_blank">Support Center</a>
<noscript><img alt="" src="/stat?jsdisabled=true&amp;ncbi_app=genbank&amp;ncbi_db=&amp;ncbi_pdid=custom-page&amp;ncbi_phid=CE8EA1107C7F390100000000013300F0" /></noscript>
</div>
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" class="footer" id="footer" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg xmlns="http://www.w3.org/2000/svg" width="40" height="40" viewBox="0 0 40 40" fill="none">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008" d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z" fill="#5B616B"></path>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11" d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12" d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12" d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12" d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12" d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12" d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12" d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12" d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
<defs><style>.cls-1{fill:#737373;}</style></defs>
<title>NCBI Insights Blog</title>
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
</svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Twitter</title>
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
<path id="Vector_Twitter" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
</g>
<defs>
<clipPath id="clip0_65276_3946">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine" aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Facebook</title>
<g id="Facebook" clip-path="url(#clip0_1717_1086)">
<path id="Vector_Facebook" d="M15.1147 29.1371C15.1147 29.0822 15.1147 29.0296 15.1147 28.9747V18.9414H11.8183C11.6719 18.9414 11.6719 18.9414 11.6719 18.8018C11.6719 17.5642 11.6719 16.3289 11.6719 15.0937C11.6719 14.9793 11.7062 14.9518 11.816 14.9518C12.8683 14.9518 13.9206 14.9518 14.9751 14.9518H15.1215V14.8329C15.1215 13.8057 15.1215 12.774 15.1215 11.7492C15.1274 10.9262 15.3148 10.1146 15.6706 9.37241C16.1301 8.38271 16.9475 7.60378 17.9582 7.19235C18.6492 6.90525 19.3923 6.76428 20.1405 6.7783C21.0029 6.79202 21.8653 6.83091 22.7278 6.86065C22.8879 6.86065 23.048 6.89496 23.2082 6.90182C23.2974 6.90182 23.3271 6.94071 23.3271 7.02993C23.3271 7.54235 23.3271 8.05477 23.3271 8.5649C23.3271 9.16882 23.3271 9.77274 23.3271 10.3767C23.3271 10.4819 23.2974 10.5139 23.1921 10.5116C22.5379 10.5116 21.8814 10.5116 21.2271 10.5116C20.9287 10.5184 20.6316 10.5528 20.3395 10.6146C20.0822 10.6619 19.8463 10.7891 19.6653 10.9779C19.4842 11.1668 19.3672 11.4078 19.3307 11.6669C19.2857 11.893 19.2612 12.1226 19.2575 12.3531C19.2575 13.1904 19.2575 14.0299 19.2575 14.8695C19.2575 14.8946 19.2575 14.9198 19.2575 14.9564H23.0229C23.1807 14.9564 23.183 14.9564 23.1624 15.1074C23.0778 15.7662 22.9885 16.425 22.9039 17.0816C22.8322 17.6321 22.7636 18.1827 22.698 18.7332C22.6729 18.9437 22.6797 18.9437 22.4693 18.9437H19.2644V28.8992C19.2644 28.9793 19.2644 29.0593 19.2644 29.1394L15.1147 29.1371Z" fill="white"></path>
<path id="Vector_2_Facebook" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1086">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="YouTube" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>YouTube</title>
<g id="YouTube" clip-path="url(#clip0_1717_1101)">
<path id="Vector_Youtube" d="M26.2571 11.4791C25.9025 11.1589 25.5709 10.9576 24.228 10.834C22.5512 10.6785 20.2797 10.6556 18.564 10.6533H16.4365C14.7208 10.6533 12.4493 10.6785 10.7725 10.834C9.43196 10.9576 9.09798 11.1589 8.7434 11.4791C7.81464 12.321 7.6202 14.6268 7.59961 16.8938C7.59961 17.3178 7.59961 17.741 7.59961 18.1635C7.62706 20.4121 7.82837 22.686 8.7434 23.521C9.09798 23.8412 9.42967 24.0425 10.7725 24.1661C12.4493 24.3216 14.7208 24.3445 16.4365 24.3468H18.564C20.2797 24.3468 22.5512 24.3216 24.228 24.1661C25.5686 24.0425 25.9025 23.8412 26.2571 23.521C27.1722 22.6929 27.3735 20.451 27.4009 18.2206C27.4009 17.7402 27.4009 17.2599 27.4009 16.7795C27.3735 14.5491 27.1699 12.3072 26.2571 11.4791ZM15.5604 20.5311V14.652L20.561 17.5001L15.5604 20.5311Z" fill="white"></path>
<path id="Vector_2_Youtube" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1101">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br />
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br />
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white">FOIA</a><br />
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br />
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<nav class="bottom-links">
<ul class="mt-3">
<li>
<a class="text-white" href="//www.nlm.nih.gov/">NLM</a>
</li>
<li>
<a class="text-white" href="https://www.nih.gov/">NIH</a>
</li>
<li>
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
</li>
<li>
<a class="text-white" href="https://www.usa.gov/">USA.gov</a>
</li>
</ul>
</nav>
</div>
</div>
</div>
</section>
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
</div>
</div>
<!--/.footer-->
<p class="last-updated small">Last updated: 2024-03-22T15:36:55Z</p>
</div>
<!--/.page-->
</div>
<!--/.wrap-->
<span class="PAFAppResources"></span>
</div><!-- /.twelve_col -->
</div>
<!-- /.grid -->
<!-- usually for JS scripts at page bottom -->
<span class="pagefixtures"></span>
<!-- CE8B5AF87C7FFCB1_0191SID /projects/staticsites/genbank/genbank@2.21 portal107 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
<script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/js/3879255/4121861/1490097/4087685.js" snapshot="genbank"></script></body>
</html>