nih-gov/www.ncbi.nlm.nih.gov/genbank/genome_validation

1136 lines
66 KiB
XML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<!-- AppResources meta begin -->
<meta name="paf-app-resources" content="" />
<!-- AppResources meta end -->
<!-- TemplateResources meta begin -->
<meta name="paf_template" content="StdNCol" />
<!-- TemplateResources meta end -->
<!-- Page meta begin -->
<!-- Page meta end -->
<!-- Logger begin -->
<meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_app" content="genbank" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_pdid" content="custom-page" />
<!-- Logger end -->
<title>Validation Error Explanations for Genomes</title>
<!-- PageFixtures headcontent begin -->
<meta name="cms-local-nav-url" content="https://cms.ncbi.nlm.nih.gov//genbank/_nav" />
<!-- PageFixtures headcontent end -->
<!-- AppResources external_resources begin -->
<script type="text/javascript" src="/core/jig/1.15.6/js/jig.min.js"></script>
<!-- AppResources external_resources end -->
<!-- Page headcontent begin -->
<meta name="subsite" content="genbank" />
<meta name="path" content="genbank/genome_validation" />
<meta name="modified" content="2024-10-30T15:37:40Z" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="cms-edit-aux-url" content="http://cms.ncbi.nlm.nih.gov/node//edit" />
<!-- Page headcontent end -->
<!-- PageFixtures resources begin -->
<link xmlns="http://www.w3.org/1999/xhtml" type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218191/css/4207974/4206132.css" xml:base="http://127.0.0.1/sites/static/header_footer" />
<!-- PageFixtures resources end -->
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8B41FA7C7F1B610000000000F700C2.m_6" />
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/css/4121862/3974050/3917732/251717/4108189/14534/45193/3534283/4128070/3407145/4005757/4062871.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/css/3529741/3529739.css" media="print" /></head>
<body class=" col2 custom-page">
<div class="grid">
<div class="col twelve_col nomargin shadow">
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
<div class="sysmessages">
<noscript>
<p class="nojs">
<strong>Warning:</strong>
The NCBI web site requires JavaScript to function.
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
</p>
</noscript>
</div>
<!--/.sysmessage-->
<div class="wrap">
<div class="page">
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" id="universal_header" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
<div class="usa-banner-guidance-gov usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
<span class="fa fa-user" aria-hidden="true">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
<g style="fill: #fff">
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
</g>
</svg>
</span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
<span class="fa fa-times">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
</svg>
</span>
<span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br />
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
</div>
</div>
<!--/.header-->
<div class="header">
<div class="res_logo"><h1 class="res_name"><a href="/genbank/" title="GenBank home">GenBank</a></h1><h2 class="res_tagline">Public nucleic acid sequence repository</h2></div>
<div class="search"><form method="get" action="/nuccore/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="nuccore" selected="selected">Nucleotide</option><option value="sra">SRA</option><option value="books">Books</option><option value="clinvar" class="last">ClinVar</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label for="term" class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search Nucleotide" value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="isEnabled:false,disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'yes'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div></form></div>
</div>
<div class="nav_and_browser">
<div class="localnav"><ul class="jig-ncbilocalnav">
<li><a href="#">GenBank</a><ul>
<li><a href="/genbank/">About GenBank</a></li>
<li><a href="/genbank/submit_types">Submission Types</a></li>
<li><a href="/genbank/submit">Submission Tools</a></li>
<li><a href="/genbank/update">Update GenBank Records</a></li>
<li><a href="/nuccore/">Search</a></li>
<li><a href="/BLAST/Blast.cgi?CMD=Web&amp;PAGETYPE=BLASTHome">BLAST</a></li>
<li><a href="/genbank/statistics">Statistics</a></li>
<li><a href="/genbank/samplerecord/">Sample Record</a></li>
<li><a href="/genbank/sequencerevisionhistory/">Revision History</a></li>
<li><a href="/genbank/sequenceids/">Sequence IDs</a></li>
</ul>
</li>
<li><a href="#">Submit</a><ul>
<li><a href="/genbank/submit">Submission Tools</a></li>
<li><a href="/genbank/submit_types">Submission Types</a></li>
<li><a href="/WebSub/?tool=genbank">BankIt</a></li>
<li><a href="/genbank/table2asn">table2asn</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/sra/docs/sequence-data-processing">Sequence Data Processing</a></li>
</ul>
</li>
<li><a href="#">Genomes</a><ul>
<li><a href="/genbank/genomesubmit">Complete Genome Submission Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation">Prokaryotic Genome Annotation Guide</a></li>
<li><a href="/genbank/eukaryotic_genome_submission_annotation">Eukaryotic Genome Annotation Guide</a></li>
<li><a href="/genbank/examples.wgs">Annotation Examples</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/wgs/">Genome Submission Portal</a></li>
</ul>
</li>
<li><a title="Whole Genome Shotgun sequences and submissions" href="#">WGS</a><ul>
<li><a href="/genbank/wgs">About WGS</a></li>
<li><a href="/Traces/wgs">WGS Project List</a></li>
<li><a href="/genbank/wgs.submit">WGS Submission Guide</a></li>
<li><a href="/genbank/wgsfaq/">FAQ</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/wgs/">Genome Submission Portal</a></li>
<li><a href="/genbank/eukaryotic_genome_submission_annotation">Eukaryotic Annotation Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation">Prokaryotic Annotation Guide</a></li>
<li><a href="/genbank/asndisc">Discrepancy Report</a></li>
<li><a href="/assembly/agp/AGP_Specification/">AGP format</a></li>
</ul>
</li>
<li><a href="#">Metagenomes</a><ul>
<li><a href="/genbank/metagenome">About Metagenomes</a></li>
<li><a href="/genbank/structuredcomment">Structured Comment</a></li>
</ul>
</li>
<li><a href="#">TPA</a><ul>
<li><a href="/genbank/TPA">About TPA</a></li>
<li><a href="/genbank/tpafaq">FAQ</a></li>
<li><a href="/genbank/TPA-Exp">TPA-Exp</a></li>
<li><a href="/genbank/TPA-Inf">TPA-Inf</a></li>
</ul>
</li>
<li><a href="#">TSA</a><ul>
<li><a href="/genbank/TSA">About TSA</a></li>
<li><a href="/genbank/TSAguide">TSA Submission Guide</a></li>
<li><a href="/genbank/TSAfaq">FAQ</a></li>
</ul>
</li>
<li><a href="#">INSDC</a><ul>
<li><a href="/genbank/collab">About INSDC</a></li>
<li><a href="/genbank/collab/country">Geographic Location Name List</a></li>
<li><a href="/genbank/collab/db_xref">db_xref List</a></li>
<li><a href="http://www.insdc.org/documents/feature_table.html">Feature Table</a></li>
</ul>
</li>
<li><a href="#">Documentation</a><ul>
<li><a href="https://www.ncbi.nlm.nih.gov/sra/docs/sequence-data-processing/">Sequence Data Processing</a></li>
<li><a href="/genbank/submission_brokers">Submission Brokers</a></li>
<li><a href="/genbank/acc_prefix">Accession Number Prefixes</a></li>
<li><a href="/genbank/organelle_submit/">Organelle Submission Guide</a></li>
<li><a href="/genbank/monkeypox_submission/">Monkeypox Submission Guide</a></li>
<li><a href="/genbank/validation/">Common Submission Errors</a> </li>
<li><a href="/genbank/sequencecheck/">Ribosomal Submission Errors</a></li>
<li><a href="/genbank/sequencecheck/virus">Common Sequence Errors</a></li>
<li><a href="https://support.nlm.nih.gov/knowledgebase/category/?id=CAT-01240">Submission FAQs</a></li>
</ul>
</li>
<li><a href="#">Other</a><ul>
<li><a href="/genbank/htgs">About HTGs</a></li>
<li><a href="/genbank/dbest">About EST</a></li>
<li><a href="/genbank/dbgss">About GSS</a></li>
<li><a href="/genbank/tls">About TLS</a></li>
<li><a href="/genbank/tlsguide">Submit TLS</a></li>
</ul>
</li>
</ul></div>
</div>
<!-- was itemctrl -->
<div class="container">
<div id="maincontent" class="content col twelve_col last">
<div class="col1">
<h1 id="validation-error-explanations-fo">Validation Error Explanations for Genomes</h1>
<p>This page has explanations for individual errors that are commonly found during processing of prokaryotic and eukaryotic genomes, along with suggestions to fix them. Write to <a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a> if you do not know how to correct the error in your submission.</p>
<p>Explanations of disrepancy report problems that are reported in the "discrep" file can be found at <a href="https://www.ncbi.nlm.nih.gov/genbank/asndisc#fatal">https://www.ncbi.nlm.nih.gov/genbank/asndisc#fatal</a>
nd <a href="https://www.ncbi.nlm.nih.gov/genbank/asndisc.examples/">https://www.ncbi.nlm.nih.gov/genbank/asndisc.examples/</a></p>
<p>Remember that annotation is not required for genome submissions, and
that you can request NCBI's
<a href="/genome/annotation_prok/">Prokaryotic Genome Annotation Pipeline</a> for your prokaryotic genome
submissions. For more information about annotation, see the
<a href="/genbank/genomesubmit_annotation/">Prokaryotic Genome Annotation Guidelines</a>
or <a href="/genbank/eukaryotic_genome_submission_annotation/">Eukaryotic Genome Annotation Guidelines.</a></p>
<h3 id="error-list">Error List</h3>
<ul>
<li><a href="#BadCharInAuthorLastName">SEQ_FEAT_BadCharInAuthorLastName</a></li>
<li><a href="#BadCharInAuthorName">SEQ_FEAT_BadCharInAuthorName</a></li>
<li><a href="#BadCollectionCode">SEQ_DESCR_BadCollectionCode</a></li>
<li><a href="#BadCollectionDate">SEQ_DESCR_BadCollectionDate</a></li>
<li><a href="#BadGeoLocNameCode">SEQ_DESCR.BadGeoLocNameCode</a></li>
<li><a href="#BadProteinNameECnum">SEQ_FEAT.BadProteinName: Unknown or hypothetical protein should not have EC number</a></li>
<li><a href="#StartCodonandBadProteinStart">SEQ_INST.BadProteinStart</a></li>
<li><a href="#BadVoucherID">SEQ_DESCR.BadVoucherID</a></li>
<li><a href="#BioSourceMissing">SEQ_DESCR.BioSourceMissing</a></li>
<li><a href="#EcNumberProblem">SEQ_FEAT.EcNumberProblem</a></li>
<li><a href="#FeatureBeginsOrEndsInGap">SEQ_FEAT.FeatureBeginsOrEndsInGap</a></li>
<li><a href="#GenCodeInvalid">SEQ_FEAT.GenCodeInvalid</a></li>
<li><a href="#GenCodeInvalid">SEQ_FEAT.GenCodeMismatch</a></li>
<li><a href="#IllegalDbXref">SEQ_FEAT.IllegalDbXref</a></li>
<li><a href="#InconsistentTech">SEQ_DESCR.InconsistentMolInfoTechnique</a></li>
<li><a href="#InternalNsInSeqRaw">SEQ_INST.InternalNsInSeqRaw</a></li>
<li><a href="#InternalStopandStopInProtein">SEQ_FEAT.InternalStop</a></li>
<li><a href="#InvalidInferenceValueUnrecognizedDB">SEQ_FEAT.InvalidInferenceValue: unrecognized database</a></li>
<li><a href="#InvalidQualifierValuerRNAhasnoname">SEQ_FEAT.InvalidQualifierValue: rRNA has no name</a></li>
<li><a href="#LatLonGeoLocName">SEQ_DESCR.LatLonGeoLocName</a></li>
<li><a href="#LatLonFormat">SEQ_DESCR.LatLonFormat</a></li>
<li><a href="#LatLonProblem">SEQ_DESCR.LatLonProblem</a></li>
<li><a href="#LatLonRange">SEQ_DESCR.LatLonRange</a></li>
<li><a href="#LatLonValue">SEQ_DESCR.LatLonValue</a></li>
<li><a href="#MisMatchAA">SEQ_FEAT.MisMatchAA</a></li>
<li><a href="#MissingPubInfoNosubmissioncitation">GENERIC.MissingPubInfo: No submission citation anywhere on this entire record</a></li>
<li><a href="#MissingPubInfoSubmissioncitationaffiliationhasnostate">GENERIC.MissingPubInfo: Submission citation affiliation has no state</a></li>
<li><a href="#MissingPubInfo">GENERIC.MissingPubInfo</a></li>
<li><a href="#MissingPubRequirement">GENERIC.MissingPubRequirement</a></li>
<li><a href="#MissingTrnaAA">SEQ_FEAT.MissingTrnaAA</a></li>
<li><a href="#NoOrgFound">SEQ_DESCR.NoOrgFound</a></li>
<li><a href="#NoPubFound">SEQ_DESCR.NoPubFound</a></li>
<li><a href="#NoSourceDescriptor">SEQ_DESCR.NoSourceDescriptor</a></li>
<li><a href="#NoStop">SEQ_FEAT.NoStop</a></li>
<li><a href="#OnlyGeneXrefs">SEQ_FEAT.OnlyGeneXrefs</a></li>
<li><a href="#PartialProblemPartialLocationStartdoesnotincludefirstlastresidue">SEQ_FEAT.PartialProblem PartialLocation: Start does not include first/last residue of sequence</a></li>
<li><a href="#ShortIntron">SEQ_FEAT.ShortIntron</a></li>
<li><a href="#ShortSeq">SEQ_INST.ShortSeq</a></li>
<li><a href="#StartCodonandBadProteinStart">SEQ_FEAT.StartCodon</a></li>
<li><a href="#InternalStopandStopInProtein">SEQ_INST.StopInProtein</a></li>
<li><a href="#TerminalNs">SEQ_INST.TerminalNs</a></li>
<li><a href="#TransLen">SEQ_FEAT.TransLen</a></li>
<li><a href="#UnknownFeatQualprotein_id">SEQ_FEAT.UnknownFeatureQual: orig_protein_id</a></li>
<li><a href="#UnstructuredVoucher">SEQ_DESCR.UnstructuredVoucher</a></li>
<li><a href="#UnwantedCompleteFlag">SEQ_DESCR.UnwantedCompleteFlag</a></li>
<li><a href="#WrongVoucherType">SEQ_DESCR.WrongVoucherType</a></li>
</ul>
<h3 id="BadCharInAuthorLastName">SEQ_FEAT_BadCharInAuthorLastName</h3>
<p><em>Explanation</em> : An author name has illegal characters.</p>
<p><em>Suggestion</em> : Check the last names (family names) in the sequence and
publication references. Use only plain ASCII text for the names. The
last name should NOT contain symbols, numbers, accents, umlauts,
characters with diacritical marks, and should NOT end in
punctuation. Note that names with internal punctuation such as
"St. John" or "D'Abaco" will validate.</p>
<p>examples:</p>
<pre><code>incorrect: Henry Jones., Carlos Méndez, Xu 1Weng
corrected: Henry Jones, Carlos Mendez, Xu Weng
</code></pre>
<p>The use of a terminal period and number in these family names causes
an error. The error can be corrected by removing the symbols,
characters with diacritical marks, numbers, or punctuation.</p>
<h3 id="BadCharInAuthorName">SEQ_FEAT_BadCharInAuthorName</h3>
<p><em>Explanation</em> : An author name has illegal characters.</p>
<p><em>Suggestion</em> : Check the first names (given names) in the sequence and
publication references. Use only plain ASCII text for the names. The
names should NOT contain symbols, numbers, accents, umlauts,
characters with diacritical marks, and should NOT end in
punctuation. Note that names with internal punctuation such as
"St. John" or "D'Abaco" or "Doe-Smith" are okay.</p>
<p>examples:</p>
<pre><code>incorrect: J\#ane Doe, José Perez, 1Xu Weng
corrected: Jane Doe, Jose Perez, Xu Wang
</code></pre>
<p>The use of symbols and numbers causes an error. The error can be
corrected by removing the symbols, characters with diacritical marks,
numbers, or punctuation.</p>
<h3 id="BadCollectionCode">SEQ_DESCR.BadCollectionCode</h3>
<p><em>Explanation:</em> The culture collection is not in the list of registered institutes, or is in the wrong format, or there are multiple culture-collections in a single qualifier.</p>
<p><em>Suggestion:</em> See the description for the proper format and list of
allowed institutes,
<a href="https://www.insdc.org/controlled-vocabulary-culturecollection-qualifier">https://www.insdc.org/controlled-vocabulary-culturecollection-qualifier</a>.
Include only the culture-collection from which the sample was
obtained. If the sample was deposited into multiple
culture-collections, then present each culture-collection in a
separate qualifier. If the culture collection is not in the list of
allowed institutes, write to us with details of the culture
collection. If the error is from a genome that was created from a
fasta submission, then the information comes from the BioSample,
which will need to be updated. Send the correct source information to
us at <a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a>, and we will update the genome and
BioSample. Be sure to include the SUBid of the genome submission and
the accession of the BioSample (SAMNxxxxxxxx), if one has been
assigned.</p>
<p>Note that culture-collection should be used for microbial sequences,
while specimen-voucher should be used for plants and animals
only. However, do not use specimen-voucher to describe host
information for a microbial sequence submission.</p>
<h3 id="BadCollectionDate">SEQ_DESCR_BadCollectionDate</h3>
<p><em>Explanation:</em> The collection date is not in the required format.</p>
<p><em>Suggestion:</em> Correct the collection-date source modifier so the date
is in the correct format. For example, a collection-date should be
formatted like this: <code>DD-MMM-YYYY</code>, where the month is the three-letter
code in English. Alternatively, the ISO 8601 standard may be used;
see descriptions and examples on
<a href="https://www.insdc.org/files/feature_table.html">the INSDC Feature Table page</a>.
If the error
is from a genome that was created from a fasta submission, then the
information comes from the BioSample, which will need to be
updated. Send the correct source information to us at
<a href="mailto:genomes@ncbi.nlm.nih.gov">genomes@ncbi.nlm.nih.gov</a>, and we will update the genome and
BioSample. Be sure to include the SUBid of the genome submission and
the accession of the BioSample (SAMNxxxxxxxx), if one has been
assigned.</p>
<p>Examples of correctly formatted collection-dates:</p>
<pre><code>01-Jul-1999
Nov-2010
2008
</code></pre>
<p>INSDC has approved a list of <a href="https://www.insdc.org/technical-specifications/missing-value-reporting/">null terms</a> that must be used for reporting missing values in /collection_date. </p>
<h3 id="BadGeoLocNameCode">SEQ_DESCR_BadGeoLocNameCode</h3>
<p><em>Explanation:</em> The geographic location name (geo_loc_name), up to the first colon, is not on the approved list of geographic location names.</p>
<p><em>Suggestion:</em> Correct the geo_loc_name source modifier with a geographic location name
on the approved <a href="/genbank/collab/country/">geographic location name list</a> and verify the
geo_loc_name value is correctly formatted. If you want to include more
specific location information, you must place the approved geographic location
name first, followed by a colon and then the additional
information. The geo_loc_name has a specific format and must be formatted
as follows:</p>
<pre><code>&lt;approved geographic location name&gt;: &lt;region or specific area&gt;
</code></pre>
<p>Examples:</p>
<pre><code>Iceland
Canada: Vancouver
Atlantic Ocean: Charlie Gibbs Fracture Zone
</code></pre>
<p>If the error is from a genome that was created from a fasta
submission, then the information comes from the BioSample, which will
need to be updated. Send the correct source information to us at
genomes@ncbi.nlm.nih.gov, and we will update the genome and
BioSample. Be sure to include the SUBid of the genome submission and
the accession of the BioSample (SAMNxxxxxxxx), if one has been
assigned.</p>
<p>INSDC has approved a list of <a href="https://www.insdc.org/technical-specifications/missing-value-reporting/">null terms</a> that must be used for reporting missing values in /geo_loc_name. </p>
<h3 id="BadProteinNameECnum">SEQ_FEAT.BadProteinName: Unknown or hypothetical protein should not have EC number</h3>
<p><em>Explanation:</em> The product name is "hypothetical protein" and there is an EC number.</p>
<p><em>Suggestion:</em> If this really is a hypothetical protein, simply remove the EC number. If the EC number is correct, use that to provide a valid product name.</p>
<h3 id="BadVoucherID">SEQ_DESCR.BadVoucherID</h3>
<p><em>Explanation:</em> The voucher is missing a specific identifier.</p>
<p><em>Suggestion:</em> Correct the format of the culture-collection or
specimen-voucher source modifiers. The culture-collection or
specimen-voucher is missing the identifier. If the error is from a
genome that was created from a fasta submission, then the information
comes from the BioSample, which will need to be updated. Send the
correct source information to us at genomes@ncbi.nlm.nih.gov, and we
will update the genome and BioSample. Be sure to include the SUBid of
the genome submission and the accession of the BioSample
(SAMNxxxxxxxx), if one has been assigned.</p>
<p>The culture-collection must be formatted like this: <code>&lt;institution-code&gt;:\[&lt;collection-code&gt;:\]&lt;culture id&gt;</code>.
The institution code and culture ID are required, the collection-code
is optional. The institution code must be valid. See the
<a href="https://www.insdc.org/controlled-vocabulary-culturecollection-qualifier">description for the proper format</a>
and
<a href="https://ftp.ncbi.nlm.nih.gov/pub/taxonomy/coll_dump.txt">list of all allowed institutions</a>.</p>
<p>An example culture-collection is: <code>CBS:1234</code></p>
<p>Culture-collection should be used for microbial sequences, while
specimen-voucher should be used for plants and animals only. Do not
use specimen-voucher to describe host information for a microbial
sequence submission. The specimen-voucher is not required to be
structured.</p>
<h3 id="BioSourceMissing">SEQ_DESCR_BioSourceMissing</h3>
<p><em>Explanation:</em> The biological source of this sequence has not been described correctly. A submission must have a source descriptor that covers the entire molecule. Please add the source information.</p>
<p><em>Suggestion:</em> Provide an organism name for each sequence in your submission.</p>
<h3 id="EcNumberProblem">SEQ_FEAT.EcNumberProblem</h3>
<p><em>Explanation:</em> Apparent EC number in protein title. A product name includes a value that looks like an EC number, e.g. : "L-pipecolate oxidase (1.5.3.7)"</p>
<p><em>Suggestion:</em> Remove the EC number from the product name and field it in the EC_number qualifier. If it is something else, e.g. a TC number, then move it to a note.</p>
<h3 id="FeatureBeginsOrEndsInGap">SEQ_FEAT.FeatureBeginsOrEndsInGap</h3>
<p><em>Explanation:</em> A feature begins or ends in a gap.</p>
<p><em>Suggestion:</em> Remove the feature or adjust its location to be partial and abut the gap, whichever is appropriate.</p>
<h3 id="GenCodeInvalid">SEQ_FEAT.GenCodeInvalid and SEQ_FEAT.GenCodeMismatch</h3>
<p><em>Explanation:</em> The genetic code seems to be invalid or incorrect.</p>
<p><em>Suggestion:</em> If the organism is a prokaryote, then include -j "[gcode=11]" in the command line to force the use of the prokaryotic genetic code. If the organism is not a prokaryote, then you can ignore this error and we will address it during processing. </p>
<h3 id="IllegalDbXref">SEQ_FEAT.IllegalDbXref</h3>
<p><em>Explanation:</em> The database in the db_xref has the abbreviation or is not one of the <a href="/genbank/collab/db_xref">allowed databases</a></p>
<p><em>Suggestion:</em> If the database that you are using is not one of the <a href="/genbank/collab/db_xref">allowed databases</a>, then change the db_xref to a note. (However, do no use GI as a db_xref because that is an internal technical database.)</p>
<h3 id="InconsistentTech">SEQ_DESCR.InconsistentMolInfoTechnique</h3>
<p><em>Explanation:</em> A WGS accession appears to be present but the wgs technique is not set.</p>
<p><em>Suggestion:</em> You can ignore this error and we will address it during processing. However, you can quiet the error yourself if you wish by including -j "[tech=wgs]" in the command line. </p>
<h3 id="InternalNsInSeqRaw">SEQ_INST.InternalNsInSeqRaw</h3>
<p><em>Explanation:</em> A sequence has a run of 100 or more Ns, which is most likely a gap, not a run of ambiguous bases.</p>
<p><em>Suggestion:</em> Label the run's of N's as assembly_gaps. Choose a smaller length (e.g. 1 or 10) to convert runs of Ns to an assembly_gap with the appropriate linkage evidence. Do not simply remove internal N's.</p>
<h3 id="InternalStopandStopInProtein">SEQ_FEAT.InternalStop and SEQ_INST.StopInProtein</h3>
<p><em>Explanation:</em> The InternalStop and StopInProtein errors are produced when there is an internal stop codon within the CDS.</p>
<p><em>Suggestion:</em> The problem could be the genetic code, the location of the CDS, the reading frame of the CDS, or that the CDS cannot produce an error-free translation. Use the correct <a href="/Taxonomy/Utils/wprintgc.cgi">genetic code</a> to get the correct translations. For example, include [gcode=11] for prokaryotic genome submissions. If the genetic code is correct, then adjust the CDS location, if possible. If the CDS is partial at its 5' end, then you might need to add a codon_start qualifier with a value of 2 or 3 to shift the reading frame one or two bases, respectively. If the CDS does not have an error-free translation, then add the /pseudo qualifier to the gene to indicate that the CDS cannot be translated.</p>
<h3 id="InvalidQualifierValuerRNAhasnoname">SEQ_FEAT.InvalidQualifierValue: rRNA has no name</h3>
<p><em>Explanation:</em> rRNA features must have a product name.</p>
<p><em>Suggestion:</em> Use the appropriate full product name for each rRNA feature, e.g. "16S ribosomal RNA"</p>
<h3 id="InvalidInferenceValueUnrecognizedDB">SEQ_FEAT.InvalidInferenceValue: unrecognized database</h3>
<p><em>Explanation:</em> The database in the structured inference qualifier is not one of the expected ones.</p>
<p><em>Suggestion:</em> See the instructions for <a href="/genbank/evidence/">evidence qualifiers</a> and use one of listed acronyms. If the database that you are referring to is not on the list, then consider including the information as a /note, rather than an /inference.</p>
<h3 id="LatLonGeoLocName">SEQ_DESCR_LatLonGeoLocName</h3>
<p><em>Explanation:</em> lat_lon and geographic location (geo_loc_name) disagree</p>
<p><em>Suggestion:</em> The latitude-longitude (lat-lon) value provided does not map to the source geographic location (geo_loc_name) provided, so correct or remove the lat-lon values and/or geo_loc_name source modifiers. Provide lat-lon in decimal degrees with the compass direction (for example: 39.7 N 42.1 W) and check that the lat-lon coordinates map to the geographic location you have provided. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<h3 id="LatLonFormat">SEQ_DESCR_LatLonFormat</h3>
<p><em>Explanation:</em> The format of lat-lon should be dd.dd N|S ddd.dd E|W.</p>
<p><em>Suggestion:</em> Correct the latitude-longitude (lat-lon) source modifier with lat-lon coordinates in decimal degree format with the compass directions. For example: 39.7 N 42.1 W If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<h3 id="LatLonProblem">SEQ_DESCR_LatLonProblem</h3>
<p><em>Explanation:</em> There is a problem with the lat-lon modifier provided.</p>
<p><em>Suggestion:</em> Correct or remove the latitude-longitude (lat-lon) values in the source modifiers. Provide lat-lon in decimal degrees and include the compass direction (for example, 39.7 N 42.1 W). Longitude values range from 0 to 180E or 0 to 180W. Latitude values range from 0 to 90 N or 0 to 90 S. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<h3 id="LatLonRange">SEQ_DESCR_LatLonRange</h3>
<p><em>Explanation:</em> Latitude or longitude is out of range.</p>
<p><em>Suggestion:</em> Correct or remove the latitude-longitude (lat-lon) values in the source modifiers. Provide lat-lon in decimal degrees and include the compass direction (for example, 39.7 N 42.1 W). Longitude values range from 0 to 180E or 0 to 180W. Latitude values range from 0 to 90 N or 0 to 90 S. Numbers outside of these ranges will cause errors. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<h3 id="LatLonValue">SEQ_DESCR_LatLonValue</h3>
<p><em>Explanation:</em> Latitude or longitude values appear to be in the wrong hemisphere or swapped.</p>
<p><em>Suggestion:</em> Correct or remove the latitude- longitude (lat-lon) values in the source modifiers. The lat-lon value for the record does not agree with the source geographic location (geo_loc_name) provided. Based on the source geographic location, the lat-lon value appears to have the incorrect hemisphere or is swapped. Check the coordinates and compass direction and provide the correct values. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<h3 id="MisMatchAA">SEQ_FEAT.MisMatchAA</h3>
<p><em>Explanation:</em> The conceptual translation does not match the provided translation.</p>
<p><em>Suggestion:</em> Make the CDS partial if it does not begin at the start codon (and extend to end of the sequence for incomplete prokaryotic sequence). Set the genetic code of prokaryotes ( [gcode=11] ) to get the correct translations.</p>
<h3 id="MissingPubInfoNosubmissioncitation">GENERIC.MissingPubInfo: No submission citation anywhere on this entire record</h3>
<p><em>Explanation:</em> There is no submitter block.</p>
<p><em>Suggestion:</em> Include the template when you create the .sqn submission file. You can create a template here: <a href="https://submit.ncbi.nlm.nih.gov/genbank/template/submission/">https://submit.ncbi.nlm.nih.gov/genbank/template/submission/</a> .</p>
<h3 id="MissingPubInfoSubmissioncitationaffiliationhasnostate">GENERIC.MissingPubInfo: Submission citation affiliation has no state</h3>
<p><em>Explanation:</em> The country is USA, but the state is not included in the affiliation in the submitter block.</p>
<p><em>Suggestion:</em> Include the state in the template file (for .sqn submissions) or your submission portal profile (for fasta submissions).</p>
<h3 id="MissingPubInfo">GENERIC_MissingPubInfo</h3>
<p><em>Explanation:</em> The publication is missing essential information, such as title or authors.</p>
<p><em>Suggestion:</em> Check the references. Provide author names, a title, and select the publication status (unpublished, in press, or published). If the title is published or is in press, provide additional information including publication year, journal, volume, and pages, where applicable.</p>
<h3 id="MissingPubRequirement">GENERIC_MissingPubRequirement</h3>
<p><em>Explanation:</em> The REFERENCE that includes the submitter information is missing. </p>
<p><em>Suggestion:</em> Make the <a href="https://submit.ncbi.nlm.nih.gov/genbank/template/submission/">template file</a> and call it with the -t argument in the command line: -t template.sbt</p>
<h3 id="MissingTrnaAA">SEQ_FEAT.MissingTrnaAA</h3>
<p><em>Explanation:</em> The amino acid that the tRNA carries is not included.</p>
<p><em>Suggestion:</em> Include the amino acid as the product of the tRNA. If the amino acid of a tRNA is unknown, use tRNA-Xxx as the product. See <a href="/genbank/genomesubmit_annotation#RNA">prokaryotic examples</a> and <a href="/genbank/eukaryotic_genome_submission_annotation#rRNA">eukaryotic examples</a> .</p>
<h3 id="NoOrgFound">SEQ_DESCR.NoOrgFound</h3>
<p><em>Explanation:</em> No organism name is included.</p>
<p><em>Suggestion:</em> Include the organism information when creating the .sqn file. When running table2asn (or tbl2asn), the organism information can be included in the definition lines of the fasta files or in the command line with <code>-j</code>.</p>
<h3 id="NoPubFound">SEQ_DESCR.NoPubFound</h3>
<p><em>Explanation:</em> There is no submitter block or other reference.</p>
<p><em>Suggestion:</em> Include the template when you create the .sqn submission file. You can create a template here: <a href="https://submit.ncbi.nlm.nih.gov/genbank/template/submission/">https://submit.ncbi.nlm.nih.gov/genbank/template/submission/</a> .</p>
<h3 id="NoSourceDescriptor">SEQ_DESCR.NoSourceDescriptor</h3>
<p><em>Explanation:</em> There is no source information included.</p>
<p><em>Suggestion:</em> Include the source by including the information in the fasta headers OR the -j argument in the command line. See the available <a href="https://www.ncbi.nlm.nih.gov/genbank/mods_fastadefline/">source modifiers</a>. For a genome you only need to include the organism and strain (for microbes) or organism and breed/ecotype/cultivar and isolate for plants and animals because the information in the BioSample will be added to the genome.</p>
<h3 id="NoStop">SEQ_FEAT.NoStop</h3>
<p><em>Explanation:</em> The CDS is not marked as partial at its 3 end and does not end with a stop codon.</p>
<p><em>Suggestion:</em> Extend the CDS to the stop codon, or mark the 3 end as partial (and extend the CDS to the end of the sequence for prokaryotic sequences), or add the /pseudo qualifier to the gene to indicate that the CDS cannot be translated.</p>
<h3 id="OnlyGeneXrefs">SEQ_FEAT.OnlyGeneXrefs</h3>
<p><em>Explanation:</em> Features, such as CDS, refer to genes but there are no corresponding gene features.</p>
<p><em>Suggestion:</em> Include gene features with a unique locus_tag on each gene.</p>
<h3 id="PartialProblemPartialLocationStartdoesnotincludefirstlastresidue">SEQ_FEAT.PartialProblem PartialLocation: Start does not include first/last residue of sequence</h3>
<p><em>Explanation:</em> Since prokaryotes have very little splicing, their features need to be complete or to extend to the end of the sequence and be partial. In eukaryotes this error can be ignored if the partial is at an intron/exon boundary.</p>
<p><em>Suggestion:</em> Extend the feature one or a few bases to the end of the sequence. If the feature is complete, remove the partial symbols. If this is only a fragment or a nonfunctional gene, change the features location to be complete and add the /pseudo qualifier to the gene.</p>
<h3 id="ShortIntron">SEQ_FEAT.ShortIntron</h3>
<p><em>Explanation:</em> The CDS contains an intron shorter than 11bp, which is generally not biologically correct and is usually included to adjust for a frameshift in the sequence. </p>
<p><em>Suggestion:</em> If the gene is frameshifted but not a pseudogene, then annotate a single gene feature across the entire span and include a <em>pseudo</em> qualifier to indicate that the gene is broken and cannot be translated as expected. In addition, you could include a brief note explaining the problem. If the gene is an actual pseudogene, then add the <em>pseudogene</em> qualifier and the appropriate <a href="https://www.insdc.org/documents/pseudogene-qualifier-vocabulary">TYPE</a> to the single gene feature. Alternatively, you can include "-c s" in the table2asn command line, in which case the CDS will have a translation but it will also have the qualifier /artificial_location="low-quality sequence region" and the protein definition line will be prefaced with "LOW QUALITY PROTEIN:"</p>
<h3 id="ShortSeq">SEQ_INST.ShortSeq</h3>
<p><em>Explanation:</em> This warning is triggered by proteins that are shorter than ten amino acids. This is probably fine and will not cause problems with your submission, but you should investigate and decide whether you think these really exist. </p>
<p><em>Suggestion:</em> This is probably fine and will not cause problems with your submission, but you should investigate and decide whether you think these really exist. If there are lots of them and they
are just short ORF calls by the annotation tool, then we recommend that you remove them unless you think that they are real.</p>
<h3 id="StartCodonandBadProteinStart">SEQ_FEAT.StartCodon and SEQ_INST.BadProteinStart</h3>
<p><em>Explanation:</em> The StartCodon and BadProteinStart errors are produced when the CDS is not marked as partial at its 5 end and does not begin with a start codon.</p>
<p><em>Suggestion:</em> Use the correct <a href="/Taxonomy/Utils/wprintgc.cgi">genetic code</a> to get the correct translations. For example, include [gcode=11] for prokaryotic genome submissions. Other possible fixes include: extend the CDS to the start codon, or mark the 5 end as partial (and extend the CDS to the end of the sequence for prokaryotic sequences), or add the /pseudo qualifier to the gene to indicate that the CDS cannot be translated.</p>
<h3 id="TerminalNs">SEQ_INST.TerminalNs</h3>
<p><em>Explanation:</em> There are Ns at the beginning or end to the sequence.</p>
<p><em>Suggestion:</em> Remove Ns from the beginning and end of the sequence or indicate that the sequence circular, if that is applicable.</p>
<h3 id="TransLen">SEQ_FEAT.TransLen</h3>
<p><em>Explanation:</em> The length of the protein does not match the provided protein length</p>
<p><em>Suggestion:</em> Recreate the .sqn file and if the error persists, send your file to us with a description of how you created it and a request to help fix the error.</p>
<h3 id="UnknownFeatQualprotein_id">SEQ_FEAT.UnknownFeatureQual: orig_protein_id</h3>
<p><em>Explanation:</em> An older version of table2asn_GFF was used to convert a GFF file that had <em>pseudo=true</em> or <em>pseudogene=true</em></p>
<p><em>Suggestion:</em> Download the current version of table2asn_GFF and use it to make your submission. </p>
<h3 id="UnstructuredVoucher">SEQ_DESCR.UnstructuredVoucher</h3>
<p><em>Explanation:</em> The voucher needs to be structured as "&lt;institution-code&gt;:[&lt;collection-code&gt;:]&lt;culture id&gt;".</p>
<p><em>Suggestion:</em> Correct the format of the culture-collection source modifier. The institution code and culture ID are required, the collection-code is optional. Follow the formatting instruction in the explanation. The culture collection must have a valid institution code followed by a colon and the culture ID. See the <a href="https://ftp.ncbi.nlm.nih.gov/pub/taxonomy/coll_dump.txt">list</a> of allowed institutes. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<p>For example CBS:1234</p>
<p>In this example, CBS is the insitution code and 1234 is the culture ID. There must be a colon between the institution code and the culture ID.</p>
<h3 id="UnwantedCompleteFlag">SEQ_DESCR.UnwantedCompleteFlag</h3>
<p><em>Explanation:</em> The sequence is listed as complete, but there is missing information elsewhere in the record</p>
<p><em>Suggestion:</em> You can ignore this error when you have submitted a complete chromosome or plasmid or organelle.</p>
<h3 id="WrongQualOnImpFeat">SEQ_FEAT.WrongQualOnImpFeat</h3>
<p><em>Explanation:</em> The feature has an illegal qualifier</p>
<p><em>Suggestion:</em> Find the legal qualifiers for each feature in the <a href="https://www.insdc.org/documents/feature-table#7.2">Feature Table</a> .</p>
<h3 id="WrongVoucherType">SEQ_DESCR_WrongVoucherType</h3>
<p><em>Explanation:</em> The institution (or institution: collection) code normally uses a different bio material/culturecollection/specimen voucher type.</p>
<p><em>Suggestion:</em> In the source modifiers, use the source modifier "culture-collection" instead of "specimen-voucher" or vice versa. For example, if you provided the source modifiers in a tab-delimited table, edit the table so the column header "culture-collection" is used in place of "specimen-voucher" and upload the revised table. If the error is from a genome that was created from a fasta submission, then the information comes from the BioSample, which will need to be updated. Send the correct source information to us at genomes@ncbi.nlm.nih.gov, and we will update the genome and BioSample. Be sure to include the SUBid of the genome submission and the accession of the BioSample (SAMNxxxxxxxx), if one has been assigned.</p>
<p>Note that culture-collection should be used for microbial sequences, while specimen-voucher should be used for plants and animals only. Do not use specimen-voucher to describe host information for a microbial sequence submission.</p>
</div>
<!--/.col1-->
<div class="col2">
<div class="rightnav">
<h2 id="genome-resources">Genome Resources</h2>
<ul>
<li><a href="/genbank/wgs/">About WGS</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/Traces/wgs/?view=wgs">WGS Browser</a></li>
<li><a href="/genbank/genomesubmit/">Genome Submission Guide</a></li>
<li><a href="https://submit.ncbi.nlm.nih.gov/subs/genome/">Genome Submission Portal</a></li>
<li><a href="/genbank/wgs_update/">Update Genome Records</a></li>
<li><a href="/genbank/wgsfaq/">FAQ</a></li>
<li><a href="/genbank/table2asn">table2asn</a></li>
<li><a href="/genbank/diploid_haps">Submitting Multiple Haplotype Assemblies</a></li>
<li><a href="/WebSub/template.cgi/">Create Submission Template</a></li>
<li><a href="/genbank/eukaryotic_genome_submission/">Eukaryotic Annotation Guide</a></li>
<li><a href="/genbank/genomesubmit_annotation/">Prokaryotic Annotation Guide</a></li>
<li><a href="/genbank/examples.wgs/">Annotation Example Files</a></li>
<li><a href="/genbank/genomes_gff">Annotating Genomes with GFF3 or GTF files</a></li>
<li><a href="/genbank/genome_validation">Validation Error Explanations for Genomes</a></li>
<li><a href="/genbank/asndisc/">Discrepancy Report</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/genome/annotation_prok/">NCBI Prokaryotic Genome Annotation Pipeline</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/assembly/agp/AGP_Specification/">AGP Format</a></li>
<li><a href="/genbank/metagenome/">Metagenome Submission Guide</a></li>
<li><a href="/genbank/structuredcomment/">Structured Comment</a></li>
<li><a href="/bioproject/">BioProject</a></li>
<li><a href="/biosample/">BioSample</a></li>
</ul>
</div>
</div>
<!--/.col2-->
<div class="col3">
</div>
<!--/.col3-->
<div class="col4">
</div>
<!--/.col4-->
<div class="col5">
</div>
<div class="col6">
</div>
<div class="col7">
</div>
<div class="col8">
</div>
<div class="col9">
</div>
</div><!--/.content-->
</div><!--/.container-->
<div id="NCBIFooter_dynamic">
<div class="breadcrumbs">You are here:
<span id="breadcrumb_text"><a href="/guide/">NCBI</a></span></div>
<a id="help-desk-link" class="help_desk" href="https://support.ncbi.nlm.nih.gov/ics/support/default.asp?Time=2025-03-05T02:46:03-05:00&amp;Snapshot=%2Fprojects%2Fstaticsites%2Fgenbank%2Fgenbank@2.21&amp;Host=portal104&amp;ncbi_phid=CE8B41FA7C7F1B610000000000F700C2&amp;ncbi_session=CE8B5AF87C7FFCB1_0191SID&amp;from=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fgenbank%2Fgenome_validation%2F&amp;Ncbi_App=genbank&amp;Page=custom-page&amp;style=classic&amp;deptID=28049" target="_blank">Support Center</a>
<noscript><img alt="" src="/stat?jsdisabled=true&amp;ncbi_app=genbank&amp;ncbi_db=&amp;ncbi_pdid=custom-page&amp;ncbi_phid=CE8B41FA7C7F1B610000000000F700C2" /></noscript>
</div>
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" class="footer" id="footer" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg xmlns="http://www.w3.org/2000/svg" width="40" height="40" viewBox="0 0 40 40" fill="none">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008" d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z" fill="#5B616B"></path>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11" d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12" d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12" d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12" d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12" d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12" d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12" d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12" d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
<defs><style>.cls-1{fill:#737373;}</style></defs>
<title>NCBI Insights Blog</title>
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
</svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Twitter</title>
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
<path id="Vector_Twitter" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
</g>
<defs>
<clipPath id="clip0_65276_3946">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine" aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Facebook</title>
<g id="Facebook" clip-path="url(#clip0_1717_1086)">
<path id="Vector_Facebook" d="M15.1147 29.1371C15.1147 29.0822 15.1147 29.0296 15.1147 28.9747V18.9414H11.8183C11.6719 18.9414 11.6719 18.9414 11.6719 18.8018C11.6719 17.5642 11.6719 16.3289 11.6719 15.0937C11.6719 14.9793 11.7062 14.9518 11.816 14.9518C12.8683 14.9518 13.9206 14.9518 14.9751 14.9518H15.1215V14.8329C15.1215 13.8057 15.1215 12.774 15.1215 11.7492C15.1274 10.9262 15.3148 10.1146 15.6706 9.37241C16.1301 8.38271 16.9475 7.60378 17.9582 7.19235C18.6492 6.90525 19.3923 6.76428 20.1405 6.7783C21.0029 6.79202 21.8653 6.83091 22.7278 6.86065C22.8879 6.86065 23.048 6.89496 23.2082 6.90182C23.2974 6.90182 23.3271 6.94071 23.3271 7.02993C23.3271 7.54235 23.3271 8.05477 23.3271 8.5649C23.3271 9.16882 23.3271 9.77274 23.3271 10.3767C23.3271 10.4819 23.2974 10.5139 23.1921 10.5116C22.5379 10.5116 21.8814 10.5116 21.2271 10.5116C20.9287 10.5184 20.6316 10.5528 20.3395 10.6146C20.0822 10.6619 19.8463 10.7891 19.6653 10.9779C19.4842 11.1668 19.3672 11.4078 19.3307 11.6669C19.2857 11.893 19.2612 12.1226 19.2575 12.3531C19.2575 13.1904 19.2575 14.0299 19.2575 14.8695C19.2575 14.8946 19.2575 14.9198 19.2575 14.9564H23.0229C23.1807 14.9564 23.183 14.9564 23.1624 15.1074C23.0778 15.7662 22.9885 16.425 22.9039 17.0816C22.8322 17.6321 22.7636 18.1827 22.698 18.7332C22.6729 18.9437 22.6797 18.9437 22.4693 18.9437H19.2644V28.8992C19.2644 28.9793 19.2644 29.0593 19.2644 29.1394L15.1147 29.1371Z" fill="white"></path>
<path id="Vector_2_Facebook" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1086">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="Youtube" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>Youtube</title>
<g id="YouTube" clip-path="url(#clip0_1717_1101)">
<path id="Vector_Youtube" d="M26.2571 11.4791C25.9025 11.1589 25.5709 10.9576 24.228 10.834C22.5512 10.6785 20.2797 10.6556 18.564 10.6533H16.4365C14.7208 10.6533 12.4493 10.6785 10.7725 10.834C9.43196 10.9576 9.09798 11.1589 8.7434 11.4791C7.81464 12.321 7.6202 14.6268 7.59961 16.8938C7.59961 17.3178 7.59961 17.741 7.59961 18.1635C7.62706 20.4121 7.82837 22.686 8.7434 23.521C9.09798 23.8412 9.42967 24.0425 10.7725 24.1661C12.4493 24.3216 14.7208 24.3445 16.4365 24.3468H18.564C20.2797 24.3468 22.5512 24.3216 24.228 24.1661C25.5686 24.0425 25.9025 23.8412 26.2571 23.521C27.1722 22.6929 27.3735 20.451 27.4009 18.2206C27.4009 17.7402 27.4009 17.2599 27.4009 16.7795C27.3735 14.5491 27.1699 12.3072 26.2571 11.4791ZM15.5604 20.5311V14.652L20.561 17.5001L15.5604 20.5311Z" fill="white"></path>
<path id="Vector_2_Youtube" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1101">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br />
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br />
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white">FOIA</a><br />
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br />
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<nav class="bottom-links">
<ul class="mt-3">
<li>
<a class="text-white" href="//www.nlm.nih.gov/">NLM</a>
</li>
<li>
<a class="text-white" href="https://www.nih.gov/">NIH</a>
</li>
<li>
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
</li>
<li>
<a class="text-white" href="https://www.usa.gov/">USA.gov</a>
</li>
</ul>
</nav>
</div>
</div>
</div>
</section>
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
</div>
</div>
<!--/.footer-->
<p class="last-updated small">Last updated: 2024-10-30T15:37:40Z</p>
</div>
<!--/.page-->
</div>
<!--/.wrap-->
<span class="PAFAppResources"></span>
</div><!-- /.twelve_col -->
</div>
<!-- /.grid -->
<!-- usually for JS scripts at page bottom -->
<span class="pagefixtures"></span>
<!-- CE8B5AF87C7FFCB1_0191SID /projects/staticsites/genbank/genbank@2.21 portal104 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
<script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4218137/js/3879255/4121861/1490097/4087685.js" snapshot="genbank"></script></body>
</html>