nih-gov/www.ncbi.nlm.nih.gov/pathogens/pathogens_help/index.html
2025-03-17 02:05:34 +00:00

10779 lines
No EOL
923 KiB
HTML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<!DOCTYPE html>
<html lang="en" >
<head >
<meta charset="UTF-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<!-- Mobile properties -->
<meta name="HandheldFriendly" content="True">
<meta name="MobileOptimized" content="320">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<!-- Stylesheets -->
<link href="/pathogens/static/django_uswds/uswds/css/uswds.css" rel="stylesheet" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/nwds.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/header.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/footer.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/form.css" />
<link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.7.0/css/font-awesome.min.css"/>
<title>
NCBI -
Pathogen Detection - NCBI
</title>
<!-- extra head -->
<!-- Favicons -->
<link rel="shortcut icon" type="image/ico" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon.ico" />
<link rel="icon" type="image/png" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon.png" />
<!-- 192x192, as recommended for Android
http://updates.html5rocks.com/2014/11/Support-for-theme-color-in-Chrome-39-for-Android
-->
<link rel="icon" type="image/png" sizes="192x192" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-192.png" />
<!-- 57x57 (precomposed) for iPhone 3GS, pre-2011 iPod Touch and older Android devices -->
<link rel="apple-touch-icon-precomposed" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-57.png">
<!-- 72x72 (precomposed) for 1st generation iPad, iPad 2 and iPad mini -->
<link rel="apple-touch-icon-precomposed" sizes="72x72" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-72.png">
<!-- 114x114 (precomposed) for iPhone 4, 4S, 5 and post-2011 iPod Touch -->
<link rel="apple-touch-icon-precomposed" sizes="114x114" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-114.png">
<!-- 144x144 (precomposed) for iPad 3rd and 4th generation -->
<link rel="apple-touch-icon-precomposed" sizes="144x144" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-144.png">
<link rel="stylesheet" href="/pathogens/static/main/styles/app.css" type="text/css" media="screen">
<link rel="stylesheet" href="/pathogens/static/main/styles/breadcrumbs.css" type="text/css" media="screen">
<style type="text/css">
a { text-decoration: underline }
</style>
<!-- Logging params: Pinger defaults -->
<meta name="ncbi_app" content="labs_pathogens" />
<meta name="ncbi_pdid" content="static" />
<meta name="ncbi_phid" content="939B8FCEB20BE4F500003D37E27A3373.1.m_5" />
<!-- /extra head -->
<link rel="stylesheet" href="/pathogens/static/main/styles/page-search.css" type="text/css">
</head>
<body >
<a class="usa-skipnav" href="#main_content">Skip to main page content</a>
<!-- ========== BEGIN HEADER ========== -->
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button
class="usa-accordion-button usa-banner-button"
aria-expanded="false"
aria-controls="gov-banner-top"
>
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div
class="usa-banner-content usa-grid usa-accordion-content"
id="gov-banner-top"
>
<div class="usa-banner-guidance-gov usa-width-one-half">
<img
class="usa-banner-icon usa-media_block-img"
src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg"
alt="Dot gov"
/>
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img
class="usa-banner-icon usa-media_block-img"
src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg"
alt="Https"
/>
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="https://www.ncbi.nlm.nih.gov/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none"
aria-controls="account_popup">
<span class="fa fa-user" aria-hidden="true"></span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu"><span class="fa fa-times"></span><span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br/>
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#main_content" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
<!-- ========== END HEADER ========== -->
<main id="main_content" accesskey="3">
<section class="pathogens-content-page usa-grid">
<div class="usa-width-one-whole ptg-top">
<div><ul id="breadcrumbs" class="usa-unstyled-list breadcrumbs">
<li><a href="https://www.ncbi.nlm.nih.gov/home/health.shtml">Health</a></li>
<li><a href="/pathogens/">Pathogen Detection</a></li>
<li>NCBI</li>
</ul>
</div>
<div class="ptg-search">
<input placeholder="Search page" type="search"/><button title="Previous" disabled="disabled"></button><button title="Next" disabled="disabled"></button>
</div>
</div>
<div> <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<!-- ============== HEAD =============== -->
<head><meta http-equiv="Content-Type" content="text/html; charset=ASCII" />
<title>NCBI Pathogen Detection Project Help Document</title>
<meta name="description" content="Help document for the Pathogen Detection Project, a resource of the National Center for Biotechnology Information (NCBI) for microbial genome sequence analysis for epidemiologic surveillance." />
<meta name="keywords" content="pathogens, genomes, genome sequences, antimicrobial resistance, AMR, antibiotic resistance, Reference Gene Catalog, genes, alleles, bacteria, microbes, Escherichia coli, E coli, Salmonella, Listeria, food borne illness, outbreaks, CDC, FDA, NCBI, National Center for Biotechnology Information" />
<meta name="robots" content="index,follow,noarchive" />
</head>
<!-- ============= END_HEAD ============= -->
<!-- ============== BODY =============== -->
<body>
<h1 id="top">Pathogen Detection Help Document</h1>
<!-- ============== BOXED_NOTE =============== -->
<h3>Beta Release</h3>
<div style="padding: 0em 2em 0em 2em">
<table cellpadding="10">
<tr>
<td bgcolor="#ffffcc">
This is a <b>beta release</b> of the Pathogens help documentation in order to make new content available, while development continues on the format and presentation of the information. Navigation tips:<br />
<ul>
<li>The <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="topic list" /> icon takes you to the list of topics for the section you are currently reading</li>
<li>The <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /> icon takes you to the top of the document</li>
</ul>
We welcome and appreciate feedback about the content, including comments about sections that are helpful as well as those in need of clarification and/or enhancement. Thank you for your feedback, which can be sent to<br /><a href="mailto:pd-help@ncbi.nlm.nih.gov">pd-help@ncbi.nlm.nih.gov</a>.
</td>
</tr>
</table>
</div>
<!-- ============== END_BOXED_NOTE =============== -->
<!-- ======== TABLE_OF_CONTENTS ========= -->
<h3 id="toc">Table of contents</h3>
<ul>
<li id="toc-what-is"><a href="#what-is">What is the NCBI Pathogen Detection project?</a></li>
<li id="toc-how-to"><a href="#how-to">How To</a></li>
<li id="toc-components"><a href="#components">Pathogens Project Components</a> (<a href="#resources">resources/tools</a>, <a href="#data-types">types of data</a>, <a href="#contributors">contributors</a>)</li>
<li id="toc-data-retrieval"><a href="#data-retrieval">Data Retrieval &amp; Analysis</a></li>
<li id="toc-isolates-browser"><a href="#isolates-browser"><b>Isolates Browser help</b></a>
<ul>
<li><a href="#isolates-browser-what-is">What is the Isolates Browser?</a></li>
<li id="toc-isolates-browser-input"><a href="#isolates-browser-input">Input to Isolates Browser</a> (<a href="#allowable-search-terms">allowable search terms</a>, <a href="#isolates-browser-basic-search">basic search</a>, <a href="#filters">filters</a>)</li>
<li id="toc-advanced-search"><a href="#isolates-browser-advanced-search">Advanced Search</a> (<a href="#solr">SOLR query language</a>, <a href="#isolates-browser-data-fields"><b>data fields</b></a>, <a href="#solr-sample-searches">examples of SOLR queries</a>)</li>
<li id="toc-isolates-browser-output"><a href="#isolates-browser-output">Output from Isolates Browser</a>
<ul>
<li><a href="/pathogens/docs/isolates_gcp">Isolates Browser Data at Google Cloud</a></li>
</ul>
</li>
</ul>
</li>
<li id="toc-snp-tree-viewer"><a href="#snp-tree-viewer"><b>SNP Tree Viewer help</b></a>
<ul>
<li><a href="#snp-tree-viewer-what-is">What is the SNP Tree Viewer?</a></li>
<li><a href="#snp-tree-viewer-access">How to access</a></li>
<li><a href="#snp-tree-viewer-output">Output: four panels in a SNP Tree Viewer display</a></li>
</ul>
</li>
<li id="toc-automated-searches"><a href="#automated-searches"><b>Automatic e-mail notifications of new data</b></a>
<ul>
<li><a href="#automated-searches-save">SAVE a search in the Pathogens Isolates Browser</a></li>
<li><a href="#automated-searches-watch">WATCH an isolate(s) in the SNP Tree Viewer</a></li>
</ul>
</li>
<li id="toc-amr"><a href="#amr"><b>Antimicrobial Resistance (AMR) resources</b></a>
<ul>
<li><a href="#amr-overview">Overview</a> (<a href="#amr-resources-schematic">schematic illustration of AMR resources</a>)</li>
<li><a href="#microbigge"><b>MicroBIGG-E:</b> <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements</a> (<a href="#microbigge-search-tips">search tips</a>, <a href="#microbigge-data-fields"><b>data fields</b></a>, <a href="#microbigge-sample-searches">use cases/sample searches</a>)
<ul>
<li> <a href="/pathogens/docs/microbigge_gcp/">MicroBIGG-E Data at Google Cloud</a></li>
</ul>
</li>
<li><a href="/pathogens/docs/microbigge_map"><b>MicroBIGG-E Map</b></a></li>
<li><a href="/pathogens/docs/ast/"><b>AST Browser</b></a> (<a href="/pathogens/docs/ast/#data-fields-in-the-ast-browser">data fields</a>, <a href="/pathogens/docs/ast_gcp/">AST data at Google Cloud</a>)</li>
<li><a href="#reference-gene-catalog"><b>Pathogen Detection Reference Gene Catalog</b></a> (<a href="#refgene-search-tips">search tips</a>, <a href="#refgene-data-fields"><b>data fields</b></a>, <a href="#refgene-sample-searches">use cases/sample searches</a>)</li>
<li><a href="/pathogens/docs/HMM_catalog"><b>Pathogen Detection Reference HMM Catalog</b></a> (<a href="/pathogens/docs/HMM_catalog/#search-tips-for-the-pathogen-det">search tips</a>, <a href="/pathogens/docs/HMM_catalog/#data-fields-in-the-pathogen-dete"><b>data fields</b></a>) </li>
<li><a href="/pathogens/docs/gene_hierarchy"><b>Pathogen Detection Reference Gene Hierarchy</b></a> (<a href="/pathogens/docs/gene_hierarchy/#how-to-search-the-reference-gene">search tips</a>, <a href="/pathogens/docs/gene_hierarchy/#data-fields-in-the-reference-gen"><b>data fields</b></a>)</li>
<li><a href="#amr-finder"><b>AMRFinderPlus</b></a></li>
</ul>
</li>
<li id="toc-ftp"><a href="#ftp">FTP Site help</a></li>
<li id="toc-submit"><a href="#submit">Data Submissions</a></li>
<li><a href="#data-processing">Data Processing Pipeline</a></li>
<li id="toc-data-retention"><a href="#data-retention">Data Retention and History Tracking</a></li>
<li><a href="#change-log">Log of Changes to the Pathogen Detection Project</a>
<ul>
<li><a href="#change-log-features">Feature deployments</a></li>
<li><a href="#change-log-organism-groups">Organism group changes</a></li>
</ul>
</li>
<li><a href="#references">References</a></li>
<li><a href="#contact">Contact the NCBI Pathogens Detection Team</a></li>
</ul>
<!-- ====== END_TABLE_OF_CONTENTS ======= -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:WHAT_IS ########## -->
<h2 id="what-is">What is the NCBI Pathogen Detection project? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#overview">Overview</a> | <a href="#access">Access Pathogen Detection Project Results</a> | <a href="#access-amr">Access Antimicrobial Resistance (AMR) Data</a> | <a href="#update-frequency">Update Frequency</a> | <a href="#change-log">Log of Changes</a> | <a href="#references">References</a> | <a href="#contact">Contact</a>
</div -->
<ul>
<li><a href="#overview">Overview</a></li>
<li><a href="#access">Where to access the Pathogens Detection Project results</a></li>
<li><a href="#access-amr">Where to access the Pathogen Detection Project Antimicrobial Resistance (AMR) Data</a></li>
<li><a href="#update-frequency">Update Frequency</a></li>
<li><a href="#references-and-contact">References and Contact Information</a></li>
</ul>
<!-- ========= WHAT_IS:OVERVIEW ============ -->
<h3 id="overview">Overview <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#what-is"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="What is the NCBI Pathogen Detection Project, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="/pathogens/">NCBI Pathogen Detection</a> project is a centralized system that integrates sequence data for bacterial pathogens.<br /><br />
NCBI Pathogen Detection integrates bacterial and fungal pathogen genomic sequences from numerous ongoing surveillance and research efforts whose sources include food, environmental sources such as water or production facilities, and patient samples. Foodborne, hospital-acquired, and other clinically infectious pathogens are included.
The system provides two major automated real-time analyses:
<ol>
<li>It quickly clusters related pathogen genome sequences to identify potential transmission chains, helping public health scientists investigate disease outbreaks</li>
<li>As part of the National Database of Antibiotic Resistant Organisms (NDARO), NCBI screens genomic sequences using AMRFinderPlus to identify the antimicrobial resistance, stress response, and virulence genes found in bacterial genomic sequences, which enables scientists to track the spread of resistance genes and to understand the relationships among antimicrobial resistance, stress response, and virulence. </li>
</ol>
A number of public health agencies and researchers in the US and internationally are collecting samples from clinical cases, from the environment, from food products, and from industrial production facilities to facilitate active, real-time surveillance of pathogens, including foodborne disease. Public health agencies and researchers sequence the samples and submit the data to NCBI, which analyzes the sequences and compares them to others in its database, including all genomes in GenBank, to identify closely related sequences. The aim is to identify closely or clonally related isolates to aid in outbreak investigation. For example the FDA, CDC, and USDA use isolates from food and the environment linked to isolates associated with human illness to aid traceback investigations and outbreak response. <i> (read more in the <a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/Factsheet_Pathogen_Detection.pdf"> Pathogen Detection factsheet </a> , and in the <a href="#contributors"> Contributors </a> section of this document) </i> <br /> <br />
<em>NOTE: NCBI Pathogen Detection does not identify outbreaks or outbreak membership. All analyses are dependent on the public data submitted to the system and the quirks of our analysis pipelines. NCBI provides a service to help identify clonal relationships based on genomic similarity. Determinations of outbreaks are done by public health organizations including CDC, FDA, and USDA. Although we take care to make the analyses as error free as possible, this is a large-scale automated pipeline that takes data from submitters and analyzes it in real time; therefore, we cannot guarantee the results to be free from error or applicable for a particular use. </em>
</div>
<!-- ======== END_WHAT_IS:OVERVIEW ========= -->
<!-- ======= WHAT_IS:ACCESS_PATHOGEN_DETECTION_PROJECT_RESULTS ======= -->
<h3 id="access">Where to access the Pathogens Detection Project results <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#what-is"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="What is the NCBI Pathogen Detection Project, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">The Pathogen Detection project can be accessed from a variety of entry points, such as:
<ul>
<li><a href="/pathogens/">Pathogens Detection home page</a> - provides an overview of the project and links to pathogens resources and tools. </li>
<li><a href="/pathogens/isolates#/search/">Pathogen Detection Isolates Browser</a> - provides an interface to search and/or subset the isolate data, displays details for each isolate, and links to a SNP Tree Viewer, which shows phylogenetic relationships among the isolates. <i>(Separate sections of this file provide <a href="#isolates-browser">Isolates Browser help documentation</a> and <a href="#snp-tree-viewer">SNP Tree Viewer help documentation</a>.)</i></li>
<li><a href="/pathogens/microbigge">Microbial Browser for Genetic and Genomic Elements (MicroBIGG-E)</a> - Provides a detailed view of genetic elements important to clinical and public health identified by <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. See the <a href="/pathogens/pathogens_help/#microbigge">MicroBIGG-E documentation</a> for more information.</li>
<li>The Pathogen Detection <a href="/pathogens/refgene">Reference Gene Catalog</a>, <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and <a href="/pathogens/hmm">Reference HMM Catalog</a> are the reference databases behind MicroBIGG-E and together they make up the <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">AMRFinderPlus database</a>. See <a href="#amr">Antimicrobial Resistance (AMR) Resources</a> for more information.</li>
<li><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">FTP site</a> provides access to the results of analyses that have been done at NCBI on the sequence reads and genome sequences of pathogen isolates. <i>(A separate section of this document provides an <a href="#ftp">overview of the data available</a> on the FTP site, and the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">FTP readme file</a> provides additional details.)</i></li>
<!-- li><a href="https://www.ncbi.nlm.nih.gov/home/health/">NCBI Health home page</a> - provides access to a variety of resources for clinical practice and medical research. The Pathogen Detection Project is listed under the column header for "Clinical &amp; Public Health Resources."</li><br -->
<!-- li><a href="https://www.ncbi.nlm.nih.gov/guide/sitemap/">NCBI Resource List (A-Z)</a>, under <a href="https://www.ncbi.nlm.nih.gov/guide/sitemap/#_N">"NCBI Pathogen Detection Project"</a><br />
You can also use "CTRL+F" to find the term "Pathogen" in the NCBI Resource List using your web browser's "Find in page" function.</li><br -->
</ul>
</div>
<!-- ======= END_WHAT_IS:ACCESS_PATHOGEN_DETECTION_PROJECT_RESULTS ======= -->
<!-- ======= ACCESS_ANTIMICROBIAL_RESISTANCE_DATA ======= -->
<h3 id="access-amr">Where to access Antimicrobial Resistance (AMR) Data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#what-is"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="What is the NCBI Pathogen Detection Project, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<ul>
<li><a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> is the <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements. Every row in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> display is an <b>anti-microbial resistance (AMR)</b>, <b>stress response</b>, and/or <b>virulence</b> gene that has been identified in an isolate by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>. <i>(Separate sections of this file provide <a href="#microbigge-what-is">MicroBIGG-E help documentation</a>.)</i></li>
<li><a href="/pathogens/antimicrobial-resistance/">AMR Landing page</a> - provides information about the NCBI National Database of Antibiotic Resistant Organisms (<b>NDARO</b>), a collaborative, cross-agency, centralized hub for researchers to access AMR data to facilitate real-time surveillance of pathogenic organisms.</li>
<li><a href="/pathogens/antimicrobial-resistance/resources/">AMR Resources page</a> - provides a list of available resources, with a brief description and sample searches or links to additional information about each one.</li>
<!-- ul -->
<li><a href="/pathogens/refgene/">Pathogen Detection Reference Gene Catalog</a> provides access to a curated reference set of antimicrobial resistance genes and proteins, which are stored in the <b>Bacterial Antimicrobial Resistance Reference Gene Database</b> (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>).
The Reference Gene Catalog together with the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a> and the <a href="/pathogens/hmm">Reference HMM Catalog</a> make up the AMRFinderPlus database and provide the reference data behind the <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus software</a> and <a href="/pathogens/microbigge">MicroBIGG-E browser</a>.
The source of input for these <b>curated databases</b> include: 1) allele assignments, 2) exchanges with other external curated resources, 3) reports of novel antimicrobial resistance proteins in the literature. (<i>The <a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog</a>, <a href="/pathogens/docs/gene_hierarchy/">Pathogen Detection Reference Gene Hierarchy</a>, and <a href="/pathogens/docs/HMM_catalog/">Pathogen Detection Reference HMM Catalog help documents</a> provide information on how to use the tools.</i>)</li>
<li><a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> - a tool that compares isolate genomes against the reference protein set using BLAST and against the HMM set using HMMER, and uses the <a href="/pathogens/genehierarchy">gene hierarchy</a> to provide the most specific protein assignment to antimicrobial resistant protein or family, if present in the query set of proteins. <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus</a> identifies the AMR genes and point mutations that are found by the original AMRFinder, plus it identifies select members of additional classes of genes such as virulence factors, biocide, heat, acid, and metal resistance genes. Unlike other AMR gene detection methods that report the best hit, AMRFinderPlus reports the specific gene symbol based on the available evidence. For example, when presented with a novel blaKPC allele that is nearly identical to blaKPC-2, closest hit tools might return blaKPC-2, but AMRFinderPlus would call it as blaKPC so that users do not incorrectly assume the phenotype (<a href="#amr-finder-hierarchy-illustration">illustrated example</a>). More details about the tool are provided in publications <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">Feldgarden M, et al., 2019</a> and <a href="https://www.ncbi.nlm.nih.gov/pubmed/34135355/">Feldgarden M, et al., 2021</a>.</li>
<li><a href="/pathogens/submit-data/">Submit sequence and phenotype data related to AMR</a> - includes instructions on how to submit data for real-time analysis, <a href="https://www.ncbi.nlm.nih.gov/biosample/docs/antibiogram/">submit antibiograms to the BioSample database</a>, and <a href="/pathogens/submit-beta-lactamase/">request new alleles for beta-lactamase, MCR, and Qnr Genes</a>.</li>
<!-- /ul -->
<li><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance">FTP/Raw Data Download</a> - includes AMRFinderPlus data files, the Reference Gene Catalog, Reference Gene Hierarchy, and Reference HMM Catalog, and the Bacterial Antimicrobial Resistance Reference Gene Database (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>). See <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">database documentation</a> for more information about the files and formats.</li>
</ul>
</div>
<!-- ======= END_WHAT_IS:ACCESS_ANTIMICROBIAL_RESISTANCE_DATA ======= -->
<!-- ========= WHAT_IS:UPDATE_FREQUENCY ============ -->
<h3 id="update-frequency">Update Frequency <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#what-is"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="What is the NCBI Pathogen Detection Project, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The various components of the Pathogen Detection project are updated at the following intervals:
<ul>
<li id="update-frequency-ftp-results"><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP Results</a> and <a href="/pathogens/isolates#/search/">Isolates Browser</a> and <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>
<ul>
<li>The Pathogens Detection Project analysis results are <b>updated approximately daily</b> for each taxgroup, when new data is submitted. <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP Results</a> and the <a href="/pathogens/isolates#/search/">Isolates Browser</a> are generally synchronized, but sometimes indexing delays might occur, resulting in a temporary asynchrony. The Isolates Browser and MicroBIGG-E updates are synchronized and update along with the corresponding taxgroups. The <a href="/pathogens/docs/isolates_gcp">Isolates</a> and <a href="/pathogens/docs/microbigge_gcp/">MicroBIGG-E</a> tables in Google Cloud BigQuery are updated daily and data may lag behind the web interfaces by up to one day. <br />
<i>(Read an <a href="#ftp">overview of the FTP site</a>, or go directly to the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">FTP parent directory</a> or to the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP Results</a> subdirectory. Read about the <a href="#isolates-browser">Isolates Browser</a>.)</i></li>
<li>Isolate Browser and MicroBIGG-E data in Google Cloud are updated independently, see <a href="/pathogens/docs/gcp/#update-frequency">GCP Update frequency</a> for details.</li>
</ul>
</li>
<li>The <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">AMRFinderPlus database</a> (including the <a href="/pathogens/refgene">Reference Gene Catalog</a>, <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and <a href="/pathogens/hmm">Reference HMM Catalog</a>) is updated somewhat irregularly, with releases approximately every two months; all of its components are updated simultaneously.</li>
<li id="update-frequency-ftp-rapid-reports">FTP Rapid Reports
<ul>
<li>The Rapid Reports directory of the Pathogens FTP site is a pilot phase test of rapid reporting based solely on wgMLST allele differences and currently reports on certain bioprojects and some organisms. The FTP Rapid Reports for a given organism are <b>updated within approximately an hour</b> of completing sequence read submissions for a new isolate.<br />
<i>(Read an <a href="#ftp">overview of the FTP site</a>, or go directly to the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP Results</a> subdirectory, where you can find Rapid Reports for organisms such as <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/Clostridioides_difficile/Rapid_reports/">Clostridioides difficile</a>, <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/Salmonella/Rapid_reports/">Salmonella</a>, <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/Listeria/Rapid_reports/">Listeria</a>.)</i></li>
</ul><br />
</li>
</ul>
</div>
<!-- ======== END_WHAT_IS:UPDATE_FREQUENCY ========= -->
<!-- ======== WHAT_IS:LINKS_TO_REFERENCES_AND_CONTACT ========= -->
<h3 id="references-and-contact">References and Contact Information <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#what-is"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="What is the NCBI Pathogen Detection Project, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
Separate sections of this document provide additional information, including:
<ul>
<li><a href="#references">References</a> about the Pathogen Detection Project and related initiatives</li>
<li><a href="#contact">Contact information</a> for the NCBI Pathogens Detection Team</li>
</ul>
</div>
<!-- ======== END_WHAT_IS:LINKS_TO_REFERENCES_AND_CONTACT ========= -->
<!-- ########## END_H2_SECTION:WHAT_IS ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:HOW_TO ########## -->
<h2 id="how-to">How To: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- =========== HOW_TO_MINI_TOC ========== -->
<ul>
<li><a href="/pathogens/docs/HowTo">Visual HowTos</a></li>
<li><a href="#how-to-quick-link-searches">Quick link searches</a> (e.g., quickly retrieve new isolates for a given organism group)</li>
<li><a href="#how-to-general-text-searches">General text searches</a> (e.g., "lettuce")</li>
<li><a href="#how-to-field-specific-searches">Field-specific searches</a> (e.g., retrieve isolates that were collected in a given geographic location, e.g., U.S.)</li>
<li><a href="#how-to-facet-search-results">Using filters to focus the search results</a> (e.g., retrieve isolates by scientific name, then facet the data by various criteria such as isolation source)</li>
<li><a href="#how-to-outbreak">Identify the possible source of an outbreak</a> (e.g., <i>E. coli</i> outbreak from all-purpose flour)</li>
<li>The <a href="#toc-advanced-search">Advanced Search</a> &gt; <a href="#solr-sample-searches"><span style="color:#d70000">Examples of SOLR queries</span></a> provides additional examples of field-specific searches and complex Boolean searches using the SOLR query syntax</li>
<li>The <a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog</a> &gt; <a href="#refgene-sample-searches"><span style="color:#d70000">Use cases/sample searches</span></a> section of this document shows how to find antimicrobial resistance (AMR) genes, point mutations that confer resistance, AMR content of known isolates, and more.</li>
</ul>
<!-- =========== END_HOW_TO_MINI_TOC ========== -->
<!-- ========= HOW_TO:QUICK_LINK_SEARCHES ============ -->
<h3 id="how-to-quick-link-searches">Quick link searches <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>The <a href="/pathogens/"><b>Pathogen Detection Project</b></a> home page includes an "<b>Explore the Data</b>" section. This lists the four foodborne pathogens including direct links to the Isolates Browser for <i>Salmonella enterica</i>, <i>E.coli and Shigella</i>, <i>Campylobacter jejuni</i>, <i>Listeria monocytogenes</i>, and provides instant access to isolates from those groups.</li>
<li>The <a href="/pathogens/organisms/"><b>Organism Groups</b></a> page also provides links for all available organism groups, along with additional details for each group. Note that the species name under the Organism Groups table reflects the most common species in each group, but does not reflect all species. For example, the <i>Salmonella enterica</i> organism group consists of predominantly Salmonella enterica isolates, but also <i>Salmonella bongori</i> isolates. To see the full list of organisms present in each group, see the <a href="#isolates-browser-data-field-ScientificName">scientific_name</a> column in the Isolates Browser.</li>
<li>For <b>example</b>, to quickly retrieve new isolates for <i>Salmonella enterica</i>, open the <a href="/pathogens/">Pathogen Detection Project</a> home page:
<ul>
<li>Scroll down to "<b>Explore the Data</b>" and follow the "<b>New Isolates</b>" link for the <i>Salmonella enterica</i>.</li>
<li id="new-isolates">That will retrieve isolates that have become available in the Pathogen Detection Project. <b>"New" isolates</b> are those that have been added to a <a href="#accession-prefix-pdg">Pathogen Detection Group (PDG#)</a> since the last calculation. This may have been all isolates added in the last 24 hours for frequently updated organism groups like <i>Salmonella</i>, or it may have been months since the last update and "new" isolates are now several months old, but reflect the newest isolates added to a given pathogen detection group.</li>
</ul>
</li>
</ul>
<!-- ======== END_HOW_TO:QUICK_LINK_SEARCHES ========= -->
<!-- ========= HOW_TO:GENERAL_TEXT_SEARCHES ============ -->
<h3 id="how-to-general-text-searches">General text searches <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>Simply enter text term(s) of interest (e.g., "lettuce") in the Isolates Browser to search across <b>all</b> of the text-containing fields.</li>
<li>For example, open the <a href="/pathogens/isolates#/search/">Isolates Browser</a> home page.</li>
<ul>
<li>It will display all isolates by default. Any search you enter will result in the display of only the subset of isolates that match your query.</li>
</ul><br />
<li>Enter the desired search term in the text box to display only the subset of isolates that match your query. For example, try searches for:</li>
<ul>
<li><a href="/pathogens/isolates#/search/lettuce"><i>lettuce</i></a></li>
<li><a href="/pathogens/isolates#/search/strawberries"><i>strawberries</i></a></li>
<li><a href="/pathogens/isolates#/search/%22all-purpose%20flour%22"><i>"all-purpose flour"</i></a><br />
(Separate sections of this document describe how the Isolates Browser handles <a href="#query-tips-special-characters">special characters</a> such as hyphens that are part of search terms, and provide tips about <a href="#case-sensitive">case sensitive</a> searches and the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a>.)</li>
<li><a href="/pathogens/isolates#/search/blaKPC*"><i>blaKPC*</i></a><br />
(Separate sections of this document provide additional examples of searches for <a href="#isolates-browser-data-field-AMRGenotypes">antimicrobial resistance (AMR) genotypes</a> and details about the use of <a href="#wildcards">wildcards</a> such as asterisks.)</li>
</ul><br />
<li>Use the <a href="#filters">Filters</a>, if desired, to filter the data you retrieved by characteristics such as:</li>
<ul>
<li>geographic <a href="#filter-location">location</a> where the isolate was collected</li>
<li><a href="#filter-isolation-type">isolation type</a> (clinical or environmental/other)</li>
<li><a href="#filter-property">property</a> (<a href="#data-type-genotype">has AMR genotypes</a> or <a href="#data-type-phenotype">has AST phenotypes</a>)</li>
<li><a href="#filter-target-creation">target creation</a> (date on which the isolate was first seen at the Pathogen Detection project)</li>
<li>and <a href="#filters">more...</a></li>
</ul><br />
<li>For additional information, search tips, and examples, see the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#allowable-search-terms"><b>Allowable search terms</b></a> section of this document.</li>
</ul>
<!-- ======== END_HOW_TO:GENERAL_TEXT_SEARCHES ========= -->
<!-- ===== HOW_TO:FIELD_SPECIFIC_SEARCHES ======== -->
<h3 id="how-to-field-specific-searches">Field-specific searches <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>As an alternative to general text searches, you can conduct more precise searches by limiting your query to specific data fields.<br />
<div style="padding-left: 2em">
The general <b>syntax of a field-specific search</b> is:<br />
<ul>
<li><i>searchfieldname:searchterm</i> &#160;(to search for a single term)</li>
<li><i>searchfieldname:"search phrase"</i> &#160;(use <a href="#query-tips-phrase-search-quotes">quotes to search for a phrase</a>)</li>
<li><i>searchfieldname:searchterm AND searchfieldname:searchterm</i> &#160;(use the desired <a href="#operators">Boolean operator(s)</a>)</li>
</ul>
<br />
<b>Important notes</b>:<br />
<ul>
<li>The names of <a href="#isolates-browser-data-fields">data fields</a>, and the values they contain, are <a href="#case-sensitive"><b>case sensitive</b></a>.</li>
<li>The exact name of the data fields can be seen by hovering the mouse over the column names, then a popup appears with the search syntax for that field.</li>
<li>The data field names and values might also include <a href="#special-characters">special characters</a> such as underscore bars, hyphens, parentheses, and slashes. These should be included in the query string, as the Isolates Browser has been modified relative to the SOLR Standard Query Parser to recognize and properly handle special characters that are part of a search term.</li>
</ul>
</div>
</li>
<li>For <b>example</b>, you can search the <a href="#isolates-browser-data-field-Location">Location</a> data field, as shown below, in order to retrieve isolates that were collected from a given geographic area:<br /><br />
<ul>
<li>Open the <a href="/pathogens/isolates#/search/">Isolates Browser</a> home page. It will display all isolates by default.</li>
<li>Enter the following type of search in the text box to display only the subset of isolates that have been identified by the submitter as having been collected in the USA:</li>
<ul>
<li><i>geo_loc_name:USA</i></li>
</ul>
</ul>
</li>
<li>For <b>additional examples</b>, such as searches that retrieve isolates with specific <a href="#isolates-browser-data-field-AMRGenotypes">genotypes</a> and/or <a href="#isolates-browser-data-field-ASTPhenotypes">phenotypes</a>, see the <a href="#solr-sample-searches"><b>Examples of SOLR queries</b></a> section of this document.</li>
<li>For detailed information about searching specific data fields, see the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#isolates-browser-advanced-search">Advanced Search</a> &gt; <a href="#isolates-browser-data-fields"><b>Data Fields</b></a> section of this document.</li>
</ul>
<!-- ======== END_HOW_TO:FIELD_SPECIFIC_SEARCHES ========= -->
<!-- ========= HOW_TO:FACET_THE_SEARCH_RESULTS ============ -->
<h3 id="how-to-facet-search-results">Using Filters to focus the search results <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>You can use "Filters" in order to focus on a specific subset of isolates.</li>
<li>For example, open the <a href="/pathogens/isolates#/search/"><b>Isolates Browser</b></a> home page. It will <b>display all isolates by default</b>.</li>
<li>To <b>filter</b> the isolates by criteria such as <b>isolation source</b>:</li>
<li>Click on the "<a href="#filters"><b>Filters</b></a>" menu in order to filter the data displayed by the browser.</li>
<li>Scroll down to the <b>"Isolation source" text box</b> to filter the data by source of isolation.
</li>
<li>Now the "Isolation source" filter box pops up. By default the top 100 unique values are shown, which can be viewed using the scrollbar. The number of items for each value is also shown. This box has a search bar to search for any values not displayed. Values can be selected and will update the number of items displayed in the table below. If two or more filters are open, then the selections in one filter will update the available values and unique items in the other filter.
The filters that you see are <a href="#filters-on-the-fly">generated on the fly</a> to reflect the attributes of the isolates that you are currently viewing in the browser.</li>
</ul>
<!-- ======== END_HOW_TO:FACET_THE_SEARCH_RESULTS ========= -->
<!-- ========= HOW_TO:IDENTIFY_SOURCE_OF_AN_OUTBREAK ============ -->
<h3 id="how-to-outbreak">Identify the possible source of an outbreak <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">To identify the possible source of an outbreak, you can use either one of the following methods:
<ul>
<li id="how-to-outbreak-tree-viewer"><b>Analyze data that's already available in the pathogen detection project</b> by using the <b>SNP Tree Viewer</b> to view the phylogenetic relationships among a group of sequence-similar isolates from clinical or environmental sources.<br />
<div style="padding-left: 2em">
For example, the FDA's GenomeTrakr project (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events includes a <a href="/pathogens/isolates#/search/PRJNA230969%20AND%20PDS000003441"><b>subset of <i>E. coli</i> isolates that belong to the SNP cluster "PDS000003441</b></a>." Many of the isolates in that cluster were from an outbreak that originated in all-purpose flour. <i>(<a href="https://www.cdc.gov/ecoli/2016/o121-06-16/index.html">Read more on the CDC website about that outbreak</a>.)</i><br /><br />
In the <a href="/pathogens/isolates#/search/PRJNA230969%20AND%20PDS000003441">Isolates Browser display</a>, you can <b>click on the "PDS*" accession number</b> that appears in the <b>"SNP Cluster" column</b> for any one of those isolates<!-- (e.g., isolate PDT000133982.1) --> to open a <b>Tree Viewer</b> display for the SNP cluster and interactively examine the phylogenetic distance tree. A SNP cluster contains isolate genomes that have been found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be closely related.<br /><br />
The Tree View for SNP cluster PDS000003441 shows a number of <b>clinical and environmental samples that are very closely related</b>, in some cases, with a distance of zero SNPs between the clinical and environmental samples. (Mouse over any branch in the tree to view the SNP distance between the isolates.) The phylogenetic distance tree therefore sheds light on the possible source of the outbreak.<br /><br />
<i>The <a href="#sequence-data">sequence data analysis</a> and <a href="#snp-tree-viewer">SNP Tree Viewer help</a> sections of this document provide additional details about SNP clusters and using the SNP Tree Viewer, respectively. The SNP Tree Viewer help includes an <a href="#snp-tree-viewer-access"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a> and <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>.</i><br />
</div>
<b>- or -</b><br /><br />
</li>
<li id="how-to-outbreak-ftp"><b>Submit sequence reads</b> to NCBI and obtain data analysis results on the Pathogen Detection project <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP site</a>, in the form of phylogenetic distance trees that show the relationship of your isolates to those already in the Pathogen Detection project.</li>
</ul>
<i>See the section of this document on <a href="#sequence-data">sequence data analysis</a> for more information.</i>
</div>
<!-- ======== END_HOW_TO:IDENTIFY_SOURCE_OF_AN_OUTBREAK ========= -->
<!-- ========= HOW_TO:MORE_EXAMPLES_UNDER_SOLR_QUERIES ============ -->
<h3 id="how-to-more-examples">More examples... <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#how-to"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens How To, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>The <a href="#toc-advanced-search">Advanced Search</a> &gt; <a href="#solr-sample-searches"><span style="color:#d70000">Examples of SOLR queries</span></a> section of this document provides additional examples of field-specific searches and complex Boolean searches using the SOLR query syntax.</li>
<li>The <a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog</a> &gt; <a href="#refgene-sample-searches"><span style="color:#d70000">Use cases/sample searches</span></a> section of this document shows how to find antimicrobial resistance (AMR) genes, point mutations that confer resistance, AMR content of known isolates, and more.</li>
</ul>
<!-- ======== END_HOW_TO:MORE_EXAMPLES_UNDER_SOLR_QUERIES ========= -->
<br />
<!-- ########## END_H2_SECTION:HOW_TO ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:COMPONENTS ########## -->
<h2 id="components">Pathogens Project Components <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#resources"><b>Resources/Tools</b></a>: &#160;<a href="#resource-isolates-browser">Isolates Browser</a> | <a href="#resource-snp-tree-viewer">SNP Tree Viewer</a> | <a href="#resource-amr">Antimicrobial Resistance (AMR) resources</a> | <a href="#resource-ftp">FTP site</a> | <a href="#resource-submit">Data submission tools</a><br /><br />
<a href="#data-types"><b>Types of Data</b></a>: &#160;<a href="#data-type-bioproject">BioProject records</a> | <a href="#data-type-biosample">BioSample records</a> | <a href="#data-type-sequence-read">Raw data: Sequence reads</a> | <a href="#data-type-genome">Genomes</a> | <a href="#data-type-genotype">Genotypes: antimicrobial resistance (AMR) genes</a> | <a href="#data-type-phenotype">Phenotypes: antimicrobial susceptibility test (AST) data (antibiograms)</a><br /><br />
</div -->
<ul>
<li><a href="#resources">Resources/Tools</a>
<ul>
<li><a href="#resource-isolates-browser">Isolates Browser</a></li>
<li><a href="#resource-snp-tree-viewer">SNP Tree Viewer</a></li>
<li><a href="#resource-automated-searches">Automatic e-mail notifications of new data</a></li>
<li><a href="#resource-amr">Antimicrobial Resistance (AMR) resources</a> (<a href="#amr-resources-schematic"><span style="color:#d70000">schematic illustration</span> of AMR resources</a>)</li>
<li><a href="#resource-ftp">FTP site</a></li>
<li><a href="#resource-submit">Data submission tools</a></li>
</ul>
</li>
<li><a href="#data-types">Types of Data</a>
<ul>
<li><a href="#data-type-bioproject">BioProject records</a></li>
<li><a href="#data-type-biosample">BioSample records</a></li>
<li><a href="#data-type-sequence-read">Raw data: Sequence reads</a></li>
<li><a href="#data-type-genome">Genomes</a></li>
<li><a href="#data-type-genotype">Genotypes: Antimicrobial Resistance (AMR), Virulence, and Stress Resistance Genes</a></li>
<li><a href="#data-type-phenotype">Phenotypes: Antimicrobial Susceptibility Test (AST) results (Antibiograms)</a></li>
</ul>
</li>
<li><a href="#contributors">Contributors</a>
</li>
</ul>
<!-- ========= COMPONENTS_RESOURCES/TOOLS ============ -->
<h3 id="resources">Resources/Tools <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#resource-isolates-browser">Isolates Browser</a> | <a href="#resource-snp-tree-viewer">SNP Tree Viewer</a> | <a href="#resource-automated-searches">Automatic e-mail notifications of new data</a> | <a href="#resource-amr">Antimicrobial Resistance (AMR) resources</a> | <a href="#resource-ftp">FTP site</a> | <a href="#resource-submit">Data submission tools</a>
</div>
<!-- ========= RESOURCE_ISOLATES_BROWSER ============ -->
<div style="padding-left: 2em">
<h4 id="resource-isolates-browser">Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The NCBI Pathogens <a href="/pathogens/isolates#/search/">Isolates Browser</a> is a web-based portal that integrates pathogen genomic sequences, metadata, antibiotic susceptibility and resistance gene information, and the SNP cluster information.<br /><br />
The Isolates Browser was built to answer two specific questions for incoming pathogen genomes:<br />
1) is this isolate clonally related to anything else in the database?<br />
2) what is the AMR repertoire of this isolate?<br /><br />
It allows users to browse and search over 300,000 pathogen isolates, effectively and efficiently providing access to the <a href="/pathogens/antimicrobial-resistance/">National Database of Antibiotic Resistant Organisms</a>.<br /><br />
Upon opening the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, a table displays data for all available isolates, with the most recently added data at the top. You can query the Isolates Browser with a wide variety of <a href="#allowable-search-terms">allowable search terms</a>. The data can be <b>sorted</b> by clicking on column headers, <a href="#filters">filtered</a> by using the "Filters" interface (e.g., Property: has antimicrobial resistance (AMR) genotypes), or <b>searched</b> using <a href="#isolates-browser-basic-search">basic</a> or <a href="#isolates-browser-advanced-search">advanced</a> queries.<br /><br />
Every row in the Isolates Browser is an <b>assembled isolate</b>, possibly with antimicrobial resistance (AMR), virulence, and/or stress response <a href="#data-type-genotype"><b>genotype data</b></a>, and antibiotic susceptibility (AST) <a href="#data-type-phenotype"><b>phenotype data</b></a>, as available.<br /><br />
If an isolate has a "PDS*" accession number in the "SNP Cluster" column, that indicates it is part of a SNP cluster. You can click on the PDS* accession to launch the <a href="#snp-tree-viewer"><b>SNP Tree Viewer</b></a> and examine the relationships among your isolate of interest and other isolates that have been found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be closely related.<br /><br />
<i>A separate section of this file provides <a href="#isolates-browser">Isolates Browser help documentation</a>, with details on how the browser can be used, including allowable <a href="#isolates-browser-input">input</a>, a description of the <a href="#isolates-browser-output">output</a>, and an <a href="#isolates-browser-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>.</i><br />
</div>
</div>
<!-- ====== END_RESOURCE_ISOLATES_BROWSER ========= -->
<!-- ========= RESOURCE_TREE_VIEWER ============ -->
<div style="padding-left: 2em">
<h4 id="resource-snp-tree-viewer">SNP Tree Viewer <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The SNP Tree Viewer is a component of the Pathogens <a href="/pathogens/isolates#/search/">Isolates Browser</a>. Any isolate that belongs to a SNP cluster (group of isolates whose genome assemblies are <a href="/pathogens/docs/data_processing">clustered</a>) has a link to the SNP Tree Viewer.<br /><br />
The SNP Tree Viewer displays a phylogenetic tree of pathogen isolates, built from assembled genomes by the <a href="#MaximumCompatibilityAlgorithm_2017">maximum compatibility method</a>. It shows relationships among the isolates based on the number of single nucleotide polymorphisms (SNPs) they contain relative to each other. Each tree represents a cluster of isolates that have been found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be closely related.<br /><br />
The trees can be used to examine the relationships of isolates in a SNP cluster to each other, and to identify the possible source of an outbreak based on the sequence similarity of the clinical and environmental isolates in a tree. <i>(See an example in <a href="#how-to-outbreak">How to identify the possible source of an outbreak</a>.)</i><br /><br />
<i>A separate section of this file provides <a href="#snp-tree-viewer">SNP Tree Viewer help documentation</a>, with details on how the tree viewer can be used. It includes an <a href="#snp-tree-viewer-access"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a> and <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>.</i><br />
</div>
</div>
<!-- ====== END_RESOURCE_TREE_VIEWER ========= -->
<!-- ========= RESOURCE_AUTOMATED_SEARCHES ============ -->
<div style="padding-left: 2em">
<h4 id="resource-automated-searches">Automatic e-mail notifications of new data<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
You can <b>perform a search</b> in the Pathogens Isolates Browser, or <b>select an isolate of interest</b> in the SNP Tree Viewer, and then automatically receive e-mail notifications each time new isolates become available that match your search criteria, or are closely related to your isolate of interest.<br /><br />
There are two ways to receive <a href="#automated-searches">automatic e-mail notifications of new data</a>, and you must be <a href="#automated-searches-requirements">logged into your free My NCBI</a> account to use either one:<br /><br />
<b>"Save" a search in the Isolates Browser</b><br />
<ul>
<li>A "<b>Save</b>" button in the <b>Isolates Browser</b> interface allows you to save one or more searches, and automatically notifies you about new isolates that match the criteria of each saved search.
<i>(<a href="#automated-searches-save">Read more</a> and view an <a href="#automated-searches-save-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
</ul>
<b>"Watch" an isolate of interest in the SNP Tree Viewer</b><br />
<ul>
<li>A "<b>Watch</b>" button in the <b>SNP Tree Viewer</b> interface allows you to watch one or more selected isolates in a tree, and automatically notifies you about new isolates that fall within the SNP distance that you have specified from the watched isolate(s).
<i>(<a href="#automated-searches-watch">Read more</a> and view an <a href="#automated-searches-watch-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
</ul>
</div>
</div>
<!-- ====== END_RESOURCE_AUTOMATED_SEARCHES ========= -->
<!-- ====== RESOURCE_ANTIMICROBIAL_RESISTANCE_ AMR_RESOURCES ========= -->
<div style="padding-left: 2em">
<h4 id="resource-amr">Antimicrobial Resistance (AMR) resources <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<!-- ============ MINI_TOC ============= -->
<a href="#resource-amr-landing-page">AMR Landing page</a> | <a href="#resource-amr-resources-page">AMR Resources page</a> | <a href="#resource-amr-reference-gene-catalog">Pathogen Detection Reference Gene Catalog</a> | <a href="#resource-amr-finder">AMRFinderPlus</a> | <a href="#resource-amr-microbigge">MicroBIGG-E</a> | <a href="#resource-amr-submit">Submit sequence and phenotype data related to AMR</a> | <a href="#resource-amr-ftp">FTP/Raw Data Download</a> | <a href="#resource-amr-bigquery">Data in Google Cloud</a> | <a href="#resource-amr-resources-schematic"><span style="color:#d70000">Schematic illustration</span> of AMR resources</a><br /><br />
<!-- ============ END_MINI_TOC ============= -->
As antimicrobial resistance (AMR) continues to evolve in many bacterial pathogens, the NCBI Pathogen Detection Project has developed a database to collect curated information about AMR genes, as well as tools to access the data. The AMR resources include:<br />
<ul>
<li id="resource-amr-landing-page"><a href="/pathogens/antimicrobial-resistance/">AMR Landing page</a> - provides information about the NCBI National Database of Antibiotic Resistant Organisms (<b>NDARO</b>), a collaborative, cross-agency, centralized hub for researchers to access AMR data to facilitate real-time surveillance of pathogenic organisms.</li>
<li id="resource-amr-resources-page"><a href="/pathogens/antimicrobial-resistance/resources/">AMR Resources page</a> - provides a list of available resources, with a brief description and sample searches or links to additional information about each one.</li>
<li id="resource-amr-reference-gene-catalog"><a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>
is a component of the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a>. The Reference Gene Catalog is a <a href="#refgene-non-redundant">non-redundant</a> database of bacterial genes related to antimicrobial resistance, stress resistance, virulence, and antigenicity. A graphical user interface (GUI) allows you to browse and search the Catalog, which includes <a href="#refgene-scope">two data subsets</a>:<br />
<ol>
<li>"<b>Core</b>": this subset includes highly curated, AMR-specific genes and proteins from the Bacterial Antimicrobial Resistance Reference Gene Database (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>), plus point mutations. The sources of input for this <b>curated database</b> include: 1) allele assignments, 2) exchanges with other external curated resources, 3) reports of novel antimicrobial resistance proteins in the literature.</li>
<li>"<b>Plus</b>": this subset includes genes related to biocide and stress resistance, general efflux, virulence, or antigenicity.</li>
</ol>
Every row in the Pathogen Detection Reference Gene Catalog display is a <b>reference gene</b> or a <b>point mutation</b>. The <a href="#reference-gene-catalog"><b>Pathogen Detection Reference Gene Catalog help</b></a> provides information on how to use the tool, including <a href="#refgene-search-tips">search tips</a>, <a href="#refgene-data-fields">data fields</a>, <a href="#refgene-output">output</a>, and <a href="#refgene-sample-searches"><span style="color:#d70000">use cases (sample searches)</span></a>. It is also possible to <b>download</b> the Reference Gene Catalog data by clicking on the <b>Download</b> link. <br />
<i>(The Pathogen Detection Reference Gene Catalog supersedes the previously available "AMR Reference Gene Browser," which encompassed only the "core" data set.)</i>
</li>
<li id="resource-amr-finder"><a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> - a tool that compares isolate genomes against the reference protein set using BLAST and against the HMM set using HMMER, and uses the gene hierarchy to provide the most specific protein assignment to antimicrobial resistant protein or family, if present in the query set of proteins. The <a href="https://github.com/ncbi/amr/wiki/v1-Home">original AMRFinder</a> identifies acquired antimicrobial resistance (AMR) genes, as well as point mutations that confer antimicrobial resistance, in either protein datasets or nucleotide data, including genomic data. <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus</a> identifies the AMR genes and point mutations that are found by the original AMRFinder, plus it identifies select members of additional classes of genes such as virulence factors, biocide, heat, acid, and metal resistance genes. Unlike other AMR gene detection methods that report the best hit, AMRFinderPlus reports the specific gene symbol based on the available evidence. For example, when presented with a novel blaKPC allele that is nearly identical to blaKPC-2, closest hit tools might return blaKPC-2, but AMRFinderPlus would call it as blaKPC so that users do not incorrectly assume the phenotype (<a href="#amr-finder-hierarchy-illustration">illustrated example</a>). More details about the tool are provided in a publication by <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">Feldgarden M, et al., 2019</a>.<br />
<ul>
<li>Separate sections of this document provide <a href="#amr">more details about Antimicrobial Resistance (AMR) Resources</a> and <a href="#amr-finder"><b>more details about AMRFinderPlus</b></a>, including an <a href="#amr-finder-hierarchy-illustration">illustration of the blaKPC example</a>, as well as links to <a href="#amr-finder-install">install AMRFinderPlus software</a>, <a href="#amr-finder-data-files">download data files</a><!-- (<a href="#amr-finder-reference-gene-catalog">Reference Gene Catalog data</a>, <a href="#amr-finder-hmms">Hidden Markov Models (HMMs)</a>, <a href="#amr-finder-hierarchy">AMRFinder Hierarchy</a>) -->, <a href="#amr-finder-results">interpret AMRFinderPlus results</a>, and <a href="#amr-finder-read-more">read more</a><!-- (<a href="#amr-finder-publication">publication</a>) -->.</li>
<li>See <a href="#amrfinder_citations">AMRFinderPlus references</a> for related publications.</li>
<!-- <li><b>Publication/Citation</b>: Feldgarden M, Brover V, Haft DH, Prasad AB, Slotta DJ, Tolstoy I, Tyson GH, Zhao S, Hsu CH, McDermott PF, Tadesse DA, Morales C, Simmons M, Tillman G, Wasilenko J, Folster JP, Klimke W. Validating the NCBI AMRFinder Tool and Resistance Gene Database Using Antimicrobial Resistance Genotype-Phenotype Correlations in a Collection of NARMS Isolates. <b><i>Antimicrob Agents Chemother</i> 2019</b> Aug 19. pii: AAC.00483-19. doi: 10.1128/AAC.00483-19. [Epub ahead of print] <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">PubMed PMID: 31427293</a>; <a href="https://aac.asm.org/content/early/2019/08/27/AAC.00483-19.long">Full text at AAC</a>.</li> -->
<!-- li>Publication/Citation: <a href="https://doi.org/10.1128/AAC.00483-19">Feldgarden et al. (2019), https://doi.org/10.1128/AAC.00483-19</a>, <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">PubMed PMID: 31427293</a>.
[bioRxiv: <a href="https://doi.org/10.1101/550707">Feldgarden et al. (2019), https://doi.org/10.1101/550707</a>]</li -->
</ul>
</li>
<li id="resource-amr-microbigge"><a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> is the <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements. Every row in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> display is an <b>anti-microbial resistance (AMR)</b>, <b>stress response</b>, and/or <b>virulence</b> gene that has been identified in an isolate by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, with information about the method used to identify it, supporting evidence, and the element's type, subtype, class, subclass, and more. The purpose of MicroBIGG-E is to enable researchers to obtain the actual contigs that contain a genetic or genomic element of interest, in order to conduct further analysis. The <a href="#microbigge"><b>MicroBIGG-E help</b></a> section provides information on how to use the tool<!--, including <a href="#microbigge-search-tips">search tips</a>, <a href="#microbigge-data-fields">data fields</a>, <a href="#microbigge-output">output</a>, and <a href="#microbigge-sample-searches"><span style="color:#d70000">use cases (sample searches)</span></a -->.
</li>
<li id="resource-amr-submit"><a href="/pathogens/submit-data/">Submit sequence and phenotype data related to AMR</a> - includes links to instructions on how to: <a href="/pathogens/submit-data/">submit data for real-time analysis</a>; <a href="https://www.ncbi.nlm.nih.gov/biosample/docs/antibiogram/">submit antibiograms to the BioSample database</a>; and <a href="/pathogens/submit-beta-lactamase/">request new alleles for Beta-Lactamase, MCR, and Qnr Genes</a>.</li>
<li id="resource-amr-ftp"><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/">FTP/Raw Reference Data Download</a> - includes <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">AMRFinderPlus data files</a> and the Bacterial Antimicrobial Resistance Reference Gene Database (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>).</li>
<li id="resource-amr-bigquery"><a href="https://www.ncbi.nlm.nih.gov/pathogens/docs/gcp/">Analysis results in Google Cloud</a> - Includes the full data behind MicroBIGG-E and the Isolates Browser as well as contig and protein sequences behind the elements in MicroBIGG-E</li>
<li id="resource-amr-resources-schematic">AMR resources schematic illustration - A separate section of this document provides <a href="#amr"><b>more details about Antimicrobial Resistance (AMR) Resources</b></a>, including a <a href="#amr-resources-schematic"><span style="color:#d70000">schematic illustration</span> of AMR resources</a> that shows the data sets and tools and the relationships among them. An <a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/Factsheet_AMR_Project.pdf">antimicrobial resistance factsheet</a> is also available on the FTP site.</li>
</ul>
<!-- I>A separate section of this file provides <a href="#amr">additional information about AMR resources</a>, including <a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog help documentation</a>, with details on how that resource can be used and an <a href="#AMRReferenceGeneBrowserIllustration"><span style="color:#d70000">illustrated example</span> of an AMR Reference Gene Catalog display</a>.</i><br -->
</div>
</div>
<!-- ====== END_RESOURCE_AMR_REFERENCE_GENE_BROWSER ========= -->
<!-- ========= RESOURCE_FTP_SITE ============ -->
<div style="padding-left: 2em">
<h4 id="resource-ftp">FTP site <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">Pathogens FTP site</a> provides files that contain the results of analyses done by NCBI on the isolates data that have been submitted to the <a href="/pathogens/">Pathogen Detection</a> project. The files include genome assemblies that were built from sequence reads, phylogenetic distance trees for isolates placed in clusters using the methods described in the <a href="/pathogens/docs/data_processing">data processing</a> section, and antimicrobial resistance (AMR) data.<br /><br />
<i>A separate section of this document provides an <a href="#ftp">overview of the data available</a> on the FTP site, and the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">FTP readme file</a> provides additional details.</i><br />
</div>
</div>
<!-- ====== END_RESOURCE_FTP_SITE ========= -->
<!-- ========= RESOURCE_DATA_SUBMISSION_TOOLS ============ -->
<div style="padding-left: 2em">
<h4 id="resource-submit">Data submission tools <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
NCBI provides a number of tools for submitting data to the Pathogen Detection project, and the specific tool(s) you use depends on the <a href="#data-types">types of data</a> you are submitting.<br /><br />
<i>A separate section of this document provides an <a href="#submit">overview of the data submission process</a>, and links to <a href="/pathogens/submit-data/">detailed submission instructions</a>.</i>
</div>
</div>
<!-- ====== END_RESOURCE_DATA_SUBMISSION_TOOLS ========= -->
<!-- ======== END_COMPONENTS_RESOURCES/TOOLS ========= -->
<!-- ========= COMPONENTS_DATA_TYPES ============ -->
<h3 id="data-types">Types of Data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <a href="/pathogens/"><b>Pathogen Detection</b></a> <b>Resource</b> integrates primary records from other NCBI databases so that you can search by their accessions and properties in the <a href="/pathogens/isolates#/search/">Isolates Browser</a>. Many of the data fields that are in the Isolates Browser and other Pathogen resources are derived from these primary data sources. Other data fields are derived during processing of the primary data through the data processing pipeline. The "<b>examples</b>" below retrieve samples of the data types from their original source databases. The "<b>search tips</b>" under <a href="#data-type-genotype">genotypes</a> and <a href="#data-type-phenotype">phenotypes</a> show how to retrieve those data types through the Isolates Browser. <i>A separate section of this document provides details on <a href="#isolates-browser">how to use the Isolates Browser</a>, including searches against specific <a href="#isolates-browser-data-fields">data fields</a>.</i><br /><br />
<a href="#data-type-bioproject">BioProject records</a> | <a href="#data-type-biosample">BioSample records</a> | <a href="#data-type-sequence-read">Raw data: Sequence reads</a> | <a href="#data-type-genome">Genomes</a> | <a href="#data-type-genotype">Genotypes: antimicrobial resistance (AMR) genes</a> | <a href="#data-type-phenotype">Phenotypes: antimicrobial susceptibility test (AST) data (antibiograms)</a>
</div>
<!-- ======= DATA_TYPES_AS_BULLETTED_LIST ========== -->
<!-- ======= DATA_TYPE_BIOPROJECT ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-bioproject">BioProject records <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>A <a href="https://www.ncbi.nlm.nih.gov/bioproject/">BioProject</a> is a collection of biological data related to a single initiative, originating from a single organization or from a consortium. A BioProject record provides users a single place to find links to the diverse data types generated for that project. As the sequence data archives (GenBank and SRA) require submission to a BioProject for assembled genomes, this means that every isolate in the Isolates Browser comes from one of these BioProjects. There may be many isolates from any particular BioProject.
<ul>
<li><b>Example</b>: Retrieve the <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">BioProject PRJNA230969</a>, which describes the GenomeTrakr project by the US Food and Drug Administration (FDA) to sequence <i>Escherichia coli</i> (<b><i>E. coli</i></b>) genomes for the surveillance and rapid detection of foodborne contamination events.</li>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on <!-- a href="#SubmitBioProjects" -->submitting BioProjects<!-- /a -->.</li>
<!-- li><b>Read more</b>: The <a href="https://www.ncbi.nlm.nih.gov/books/NBK169438/">BioProject chapter</a> in the <a href="https://www.ncbi.nlm.nih.gov/books/NBK143764/">NCBI Handbook, 2nd ed.</a> provides more information about the database.</li -->
</ul>
</li>
</ul>
</div>
<!-- ======= END_DATA_TYPE_BIOPROJECT ========== -->
<!-- ======= DATA_TYPE_BIOSAMPLE ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-biosample">BioSample records <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><a href="https://www.ncbi.nlm.nih.gov/biosample/">BioSample</a> records describe the biological source materials used in experimental assays. For many pathogen samples, a template/package is used that has a minimal set of required fields that was developed specifically for this project: (<a href="https://www.ncbi.nlm.nih.gov/biosample/docs/packages/Pathogen.cl.1.0/">clinical package</a>, <a href="https://www.ncbi.nlm.nih.gov/biosample/docs/packages/Pathogen.env.1.0/">environmental package</a>).<!-- biological samples from which the sequence data were obtained. (Read more in the <a href="https://www.ncbi.nlm.nih.gov/books/NBK169436/">BioSample chapter</a> in the <a href="https://www.ncbi.nlm.nih.gov/books/NBK143764/">NCBI Handbook, 2nd ed.</a>.) --></li>
<ul>
<li><b>Example</b>: Retrieve an individual BioSample record, <a href="https://www.ncbi.nlm.nih.gov/biosample/SAMN05245394">SAMN05245394</a>, for <i>Escherichia coli</i> isolated from all-purpose flour and sequenced as part of the FDA's GenomeTrakr project (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events.</li>
<li><b>Example</b>: Retrieve <a href="https://www.ncbi.nlm.nih.gov/biosample?LinkName=bioproject_biosample_all&amp;from_uid=230969">all biosamples that are part of the FDA's GenomeTrakr project</a> (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events.
<!-- BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>, the GenomeTrakr project by the US Food and Drug Administration (FDA) to sequence E. coli genomes for the surveillance and rapid detection of foodborne contamination events. --></li>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on submitting BioSamples.
</li>
</ul>
</ul>
</div>
<!-- ======= END_DATA_TYPE_BIOSAMPLE ========== -->
<!-- ======= DATA_TYPE_SEQUENCE_READS ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-sequence-read">Raw data: Sequence reads <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><a href="https://www.ncbi.nlm.nih.gov/sra/">Sequence Read Archive (SRA)</a> stores raw sequencing data and alignment information from high-throughput sequencing platforms. Most of the major pathogen surveillance efforts use next generation sequencing platforms with raw sequence data deposited in SRA. The majority of isolates in the Isolates Browser have been assembled using the Pathogen Detection <a href="/pathogens/docs/data_processing">data processing pipeline</a> from the raw data in SRA.<!-- (Read more in the <a href="https://www.ncbi.nlm.nih.gov/sra/docs/">Sequence Read Archive (SRA) Overview</a>.) -->
<ul>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on submitting sequence reads.
</li>
</ul>
</li>
</ul>
</div>
<!-- ======= END_DATA_TYPE_SHORT_READS ========== -->
<!-- ======= DATA_TYPE_GENOMES ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-genome">Genomes <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>Pathogen genomes are from two sources: 1) assemblies submitted to the GenBank nucleotide sequence database from outside contributors, 2) genomes assembled in the Pathogen Detection data processing pipeline using the raw sequencing data in SRA. <i>Currently NCBI is working on depositing these assemblies into GenBank; however, the vast majority are not yet available there.</i>
<ul>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on submitting assembled genomes.</li>
<li><b>Note</b>: Each Pathogen Detection Target (<a href="#accession-prefix-pdt">"PDT" record</a>) in the Pathogen Detection Project contains the genome assembly for a single pathogen isolate.</li>
<li>There are <b>several types of genome assemblies in the Project</b>:<br />
<ol>
<li>isolates that were submitted directly to GenBank as assembled genomes, and therefore have a corresponding <a href="#accession-prefix-gca">"GCA" accession</a></li>
<li>isolate genomes assembled by the NCBI Pathogens <a href="/pathogens/docs/data_processing">data processing</a> pipeline from sequence reads, but not published as genome sequence records in GenBank</li>
<li>isolate genomes assembled by the NCBI data processing pipeline and then submitted to GenBank either by the submitter or on behalf of the submitter with their permission.</li>
</ol>
</li>
</ul>
</li>
</ul>
</div>
<!-- ======= END_DATA_TYPE_GENOMES ========== -->
<!-- ======= DATA_TYPE_GENOTYPES ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-genotype">Genotypes <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><b>Antimicrobial resistance (AMR)</b>, <b>virulence</b>, and <b>stress resistance</b> genotypes are available in the Isolates Browser and are derived from the annotation of the assembled pathogen isolate using the NCBI <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> tool. For assemblies that have genomes already released in GenBank the full results of running AMRFinderPlus are available in <a href="/pathogens/microbigge/">MicroBIGG-E</a>. <i>(The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section of this document provides additional details about genome annotation.)</i> For more information on NCBI antimicrobial resistance resources see <a href="/pathogens/antimicrobial-resistance/">this page</a>.</li>
<ul>
<li><b>Search tip</b>: To retrieve all pathogen isolates that have AMR genotype data, open the Pathogens <a href="/pathogens/isolates#/search/">Isolates Browser</a>, click on the <b>"Filters" menu</b>, scroll down to the <b>"Property" filter</b>, and select the checkbox for the desired property, such as "<b>has AMR genotypes</b>," "<b>has stress genotypes</b>," and/or "<b>has virulence genotypes</b>". <i>(See <a href="#isolates-browser">Isolates Browser help</a> for more information about <a href="#filters">Filters</a>, as well as information about <a href="#isolates-browser-data-field-AMRGenotypes">how to search the "AMR Genotypes" data field directly</a>.)</i></li>
<li><b>Genotype categories</b>: The genes that have been identified in an isolate's genome sequence are grouped into genotype categories, such as <i><b>complete</b></i>, <i><b>partial</b></i>, <i><b>partial end of contig</b></i>. The genotype categories appear when you use the Isolates Browser's <a href="#isolates-browser-display-options">choose columns</a> function to display the genotype data columns. The <a href="#isolates-browser-data-field-AMRGenotypes"><b>AMR genotypes</b></a> column is displayed by default, and you can use the <a href="#isolates-browser-display-options">choose columns</a> function to display additional data columns, such as <a href="#isolates-browser-data-field-stress-genotypes"><b>Stress genotypes</b></a> and/or <a href="#isolates-browser-data-field-virulence-genotypes"><b>Virulence genotypes</b></a>. <i>(The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section provides <a href="/pathogens/docs/data_processing/#genotype-categories">more information about genotype categories</a>.)</i></li>
<li><b>Additional details</b>: A separate section of this document provides an <a href="#resource-amr">overview of the Antimicrobial Resistance (AMR) resources</a> that are available from the Pathogen Detection Project.</li>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on submitting antimicrobial resistance genes.</li>
</ul>
</ul>
</div>
<!-- ======= END_DATA_TYPE_GENOTYPES ========== -->
<!-- ======= DATA_TYPE_PHENOTYPES ========== -->
<div style="padding-left: 2em">
<h4 id="data-type-phenotype">Phenotypes <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><b>Antimicrobial Susceptibility Test (AST)</b> data, also referred to as <b>AST phenotypes</b> or <b>antibiograms</b>, are included by submitters as data in <a href="https://www.ncbi.nlm.nih.gov/biosample/">BioSample</a> records, when available. Those BioSample records with AST data can be retrieved from the BioSample database directly. For those BioSample records for which sequencing data is submitted, and which are also incorporated into the Pathogen resources, the Isolates Browser displays the antibiotic compounds from each antibiogram, binned into the SIR (sensitive, intermediate, resistant) calls as made by the submitter into a separate column: AST_phenotypes. You can submit AST data for your samples. See <a href="/pathogens/submit-data/#ast">How to submit</a> for information on how to submit that data.<br /><br />
<ul>
<li><b>Example</b>: View <a href="https://www.ncbi.nlm.nih.gov/biosample/SAMN05170351">BioSample SAMN05170351</a>, an <i>Escherichia coli</i> isolate that was sequenced as part of a Multi-Site Gram-Negative Bacilli Surveillance Initiative by the CDC's Emerging Infections Program (EIP), <a href="https://www.ncbi.nlm.nih.gov/bioproject/288601">BioProject PRJNA288601</a>. The BioSample record includes antibiogram data for more than 20 antibiotics.</li>
<li><b>Example</b>: Retrieve <a href="https://www.ncbi.nlm.nih.gov/biosample/?term=antibiogram%5Bfilter%5D+AND+%22Escherichia+coli%22%5Borgn%5D">all BioSample records that include antibiograms and that are from <i>Escherichia coli</i></a>.</li>
<li><b>Search tip</b>: To retrieve all pathogen isolates that have AST phenotype data, open the Pathogens <a href="/pathogens/isolates#/search/">Isolates Browser</a>, click on the <b>"Filters" menu</b>, scroll down to the <b>"Property" filter</b>, and select the checkbox for "<b>has AST phenotypes</b>." <i>(See <a href="#isolates-browser">Isolates Browser help</a> for more information about <a href="#filters">Filters</a>, as well as information about <a href="#isolates-browser-data-field-ASTPhenotypes">how to search the "AST Phenotypes" data field directly</a>.)</i><br />
Note that the Isolates Browser default display does not show the AST_Phenotypes data column, but you can easily add it to the display by using the <a href="#isolates-browser-display-options">Choose columns</a> option.</li>
<li><b>Submit</b>: See the <a href="#submit">data submissions</a> section of this document for instructions on submitting antimicrobial susceptibility test data (antibiograms).</li>
</ul>
</li>
<li>A list of possible <b>phenotype values</b> is shown on the <a href="https://www.ncbi.nlm.nih.gov/biosample/docs/beta-lactamase/">BioSample Beta-Lactamase Antibiograms</a> page, under the <b>"Resistance Phenotype" tab</b>, and includes:<br /><br />
<ul>
<li>intermediate (I)</li>
<li>nonsusceptible (NS)</li>
<li>not defined (N, ND)</li>
<li>resistant (R)</li>
<li>susceptible (S, sensitive)</li>
<li>susceptible-dose dependent (SDD)</li>
</ul>
</li>
</ul>
</div>
<!-- ======= END_DATA_TYPE_PHENOTYPES ========== -->
<!-- ====== END_DATA_TYPES_AS_BulLETTED_LIST ========= -->
<!-- ======== END_COMPONENTS_DATA_TYPES ============ -->
<!-- ========= COMPONENTS_CONTRIBUTORS ============ -->
<h3 id="contributors">Contributors <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#components"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogens Project Components, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<ul>
<li>The Pathogen Detection project continues to grow and welcomes data submissions from various contributors. The filter interface and <a href="#isolates-browser-data-fields">data fields</a> can be used to identify those agencies and organizations responsible for collecting and submitting the data. The <a href="#submit">data submissions</a> section of this document provides an overview of the submissions process and links to pages that provide detailed instructions.</li>
</ul>
</div>
<!-- ======== END_COMPONENTS_CONTRIBUTORS ========= -->
<!-- ########## END_H2_SECTION:COMPONENTS ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:DATA_RETRIEVAL_AND_ANALYSIS ########## -->
<h2 id="data-retrieval">Data Retrieval &amp; Analysis <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
Data from the <a href="/pathogens/">Pathogen Detection</a> project can be retrieved by <a href="#text-terms"><b>text term searches</b></a> or by <a href="#sequence-data"><b>sequence data analysis</b></a>, depending upon the tool you are using, as described below.<br /><br />
The Pathogen Detection project also provides <a href="#data-retrieval-automated-searches"><b>automatic e-mail notifications of new data</b></a> that alert you to new data that match the criteria of a <a href="#data-retrieval-automated-searches-save">saved search</a>, or that fall within a specified SNP distance from isolate(s) of a <a href="#data-retrieval-automated-searches-watch">watched isolate</a>.<br />
</div -->
<ul>
<li><a href="#text-terms">Text term searches</a>
<ul>
<li><a href="#text-terms-input">Input text terms</a></li>
<li><a href="#text-terms-example">Example</a></li>
<li><a href="#text-terms-output">Output list of isolates</a></li>
<!-- li><a href="#text-terms-more-info">More information</a></li -->
</ul>
</li>
<li><a href="#sequence-data">Sequence data analysis</a>
<ul>
<li><a href="#sequence-data-real-time-analysis">Real time analysis</a></li>
<li><a href="#sequence-data-input">Input sequence data</a></li>
<li><a href="#sequence-data-output">Output phylogenetic distance trees</a>
<!-- ul>
<li><a href="#sequence-data-output-snp-tree-viewer">...in SNP Tree Viewer</a></li>
<li><a href="#sequence-data-output-ftp">...on FTP site</a></li>
</ul -->
</li>
<li><a href="#sequence-data-example">Example</a></li>
<!-- li><a href="#sequence-data-more-info">More information</a></li -->
</ul>
</li>
<li><a href="#data-retrieval-automated-searches">Automatic e-mail notifications of new data</a>
<ul>
<li><a href="#data-retrieval-automated-searches-save">"SAVE" a search in the Isolates Browser</a>
<ul>
<li><a href="#automated-searches-save-illustration"><span style="color:#d70000">Illustrated example</span> of an automatic e-mail for a saved search</a></li>
</ul>
</li>
<li><a href="#data-retrieval-automated-searches-watch">"WATCH" an isolate of interest in the SNP Tree Viewer</a>
<ul>
<li><a href="#automated-searches-watch-illustration"><span style="color:#d70000">Illustrated example</span> of an automatic e-mail for a watched isolate</a></li>
</ul>
</li>
</ul>
</li>
<li><a href="/pathogens/docs/gcp/">Pathogen Detection Resources at Google Cloud Platform</a></li>
</ul>
<!-- ========= RETRIEVAL_AND_ANALYSIS_TEXT_TERMS ============ -->
<h3 id="text-terms">Text term searches <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#text-terms-input">input text terms</a> | <a href="#text-terms-example">example</a> | <a href="#text-terms-output">output list of isolates</a> | <a href="#text-terms-more-info">more information</a>
</div>
<div style="padding-left: 2em">
<h4 id="text-terms-input">Input text term(s) <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>If you want to retrieve isolates from the existing data in the Pathogen Detection project, you can use the <a href="/pathogens/isolates#/search/">Isolates Browser</a> to search for isolates that contain a term(s) of interest, as shown in the <a href="#text-terms-example">example</a> below.</li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="text-terms-example">Example of text term search: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>Retrieve the set of isolates that contain the phrase <a href="/pathogens/isolates#/search/%22all-purpose%20flour%22">"all-purpose flour"</a>.<br /><br />
<i>The <a href="#isolates-browser">Isolates Browser Help</a> section of this document provides information about <a href="#allowable-search-terms">allowable search terms</a>, <a href="#isolates-browser-query-tips">query tips</a> about <a href="#query-tips-special-characters">special characters</a> such as hyphens in search terms, the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a>, and <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a>, available <a href="#isolates-browser-data-fields">data fields</a>, and more.</i></li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="text-terms-output">Output tabular list of isolates that contain your search term(s) <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The Isolates Browser will display a table listing the isolates that contain at least one of the specified search terms (if you do a <a href="#isolates-browser-basic-search">basic search</a>), or the isolates that meet more stringent search criteria (if you do an <a href="#isolates-browser-advanced-search">advanced search</a>).<br /><br />
<i><a href="#isolates-browser-output">Read more about the Isolates Browser output</a> and see an <a href="#isolates-browser-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>.</i></li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="text-terms-more-info">More information about text term searches: tips and techniques <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><i>The <a href="#isolates-browser">Isolates Browser Help</a> section of this document provides additional information about <a href="#isolates-browser-basic-search">basic searches</a>, <a href="#isolates-browser-advanced-search">advanced searches using the <b>SOLR query language</b></a>, available <a href="#isolates-browser-data-fields"><b>data fields</b></a>, <a href="#solr-sample-searches"><span style="color:#d70000">examples of SOLR queries</span></a>, and more.</i></li>
</ul>
</div>
<!-- ======== END_RETRIEVAL_AND_ANALYSIS_TEXT_TERMS ========= -->
<!-- ========= RETRIEVAL_AND_ANALYSIS_SEQUENCE_DATA ============ -->
<h3 id="sequence-data">Sequence data analysis <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<!-- a href="#SequenceData">Sequence data analysis</a> | --><a href="#sequence-data-real-time-analysis">real time analysis</a> | <a href="#sequence-data-input">input sequence data</a> | <a href="#sequence-data-output">output phylogenetic distance trees</a> | <a href="#sequence-data-example">example</a> | <a href="#sequence-data-more-info">more information</a>
</div>
<div style="padding-left: 2em">
<h4 id="sequence-data-real-time-analysis">Real time analysis <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>Unlike other NCBI systems such as BLAST, the <a href="/pathogens/">Pathogen Detection</a> project is not built with an interactive interface that allows users to upload their data and immediately obtain an answer. Instead, this project was set up to facilitate interactive analyses of large-scale surveillance projects that are automatically submitting real-time data to the NCBI archives that are then routed to an automated pipeline that generates interactive web reports on a daily basis. The web displays allow users to search, browse, and filter the automatically analyzed data that has been already submitted.</li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="sequence-data-input">Input sequence data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>If you have sequenced <b>new isolates</b> and want to determine their relationship to existing isolates in the Pathogen Detection project, then you can follow the <a href="#submit">data submission procedures</a> described in a separate section of this document. Your submission(s) will go through the NCBI data processing pipeline, which includes sequence analysis to identify closely related isolates. The results of the analysis on your data are then made available on the FTP site and in the SNP Tree Viewer, as described in the <a href="#sequence-data-example">example</a> below.</li>
<li>All of the <b>existing isolates</b> in the Pathogen Detection project have also undergone sequence analysis after they were submitted, and their results are also available on the FTP site and in the SNP Tree Viewer.</li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="sequence-data-output">Output phylogenetic distance trees <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 1em">
NCBI has developed a <a href="/pathogens/docs/data_processing">data processing pipeline</a> that analyzes pathogens sequence data from GenBank or the Sequence Read Archive (SRA). Individual phylogenetic trees for each SNP cluster are available on FTP as well as the NCBI Pathogen Detection Isolates Browser, as noted below:<br />
<ul>
<li id="sequence-data-output-snp-tree-viewer"><b>Sequence data analysis results in SNP Tree Viewer</b> -- When you are viewing pathogens in the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, any isolate that belongs to a SNP cluster has a "PDS*" accession number in the "SNP Cluster" column of the Isolates Browser search results. The "PDS*" accession links to the SNP Tree Viewer, which displays an interactive phylogenetic tree of all the isolates in the SNP cluster.<br /><br />
<i>(See the <a href="#snp-tree-viewer">SNP Tree Viewer Help</a> section of this document for additional details on how to use that tool. It includes an <a href="#snp-tree-viewer-access"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a> and an <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>.)</i>
</li>
<li id="sequence-data-output-ftp"><b>Sequence data analysis results on FTP</b> -- The phylogenetic distance trees are also available in the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">Pathogen FTP site, under the "Results" directory</a>. (<i>A separate section of this document provides <a href="#ftp">more information about the FTP site</a></i>.)</li>
</ul>
</div>
</div>
<div style="padding-left: 2em">
<h4 id="sequence-data-example">Example of sequence data analysis results (as interactive displays in SNP Tree Viewer) <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The FDA's GenomeTrakr project (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events includes a <a href="/pathogens/isolates#/search/PRJNA230969%20AND%20PDS000003441"><b>subset of <i>E. coli</i> isolates that belong to the SNP cluster "PDS000003441"</b></a>. Upon submission to NCBI, those isolates were compared to all other isolates in the Pathogen Detection project and were found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be closely related to other isolate genome sequences in that SNP cluster. In the Isolates Browser display, you can <b>click on the "PDS*" accession number</b> that appears in the <b>"SNP Cluster" column</b> for any one of those isolates (e.g., isolate PDT000133982.1) to open a SNP Tree Viewer display for the SNP cluster and interactively examine the phylogenetic distance tree. The Tree View shows a number of <b>clinical and environmental samples that are very closely related</b>, and therefore sheds light on the possible source of the outbreak. <i>(<a href="https://www.cdc.gov/ecoli/2016/o121-06-16/index.html">Read more on the CDC website about that outbreak</a>.)</i>
</li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="sequence-data-more-info">More information about pathogen sequence data analysis <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><i>A separate section of this document provides <a href="#snp-tree-viewer">more information about the SNP Tree Viewer</a>.</i></li>
<li><i>A separate section of this document provides <a href="#ftp">more information about the FTP site</a>.</i></li>
</ul>
</div>
<!-- ======== END_RETRIEVAL_AND_ANALYSIS_SEQUENCE_DATA ========= -->
<!-- ========= RETRIEVAL_AND_ANALYSIS_AUTOMATED_SEARCHES ============ -->
<h3 id="data-retrieval-automated-searches">Automatic E-mail Notifications of New Data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
You can <b>perform a search</b> in the Pathogens Isolates Browser, or <b>select an isolate of interest</b> in the SNP Tree Viewer, and then automatically receive e-mail notifications each time new isolates become available that match your search criteria, or are closely related to your isolate of interest.<br /><br />
There are two ways to receive <a href="#automated-searches">automatic e-mail notifications of new data</a>, and you must be <a href="#automated-searches-requirements">logged into your free My NCBI</a> account to use either one:
</div>
<div style="padding-left: 2em">
<h4 id="data-retrieval-automated-searches-save">"Save" a search in the Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>A "<b>Save</b>" button in the <b>Isolates Browser</b> interface allows you to save one or more searches, and automatically notifies you about new isolates that match the criteria of each saved search.
<i>(<a href="#automated-searches-save">Read more</a> and view an <a href="#automated-searches-save-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="data-retrieval-automated-searches-watch">"Watch" an isolate of interest in the SNP Tree Viewer <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retrieval"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retrieval &amp; Analysis, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>A "<b>Watch</b>" button in the <b>SNP Tree Viewer</b> interface allows you to watch one or more selected isolates in a tree, and automatically notifies you about new isolates that fall within the SNP distance that you have specified from the watched isolate(s).
<i>(<a href="#automated-searches-watch">Read more</a> and view an <a href="#automated-searches-watch-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
</ul>
</div>
<br />
<!-- ======== END_RETRIEVAL_AND_ANALYSIS_AUTOMATED_SEARCHES ========= -->
<!-- ########## END_H2_SECTION:DATA_RETRIEVAL_AND_ANALYSIS ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:ISOLATES_BROWSER ########## -->
<h2 id="isolates-browser">Isolates Browser help <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#isolates-browser-what-is"><b>What is</b> the Isolates Browser?</a><br />
<a href="#isolates-browser-input"><b>Input</b></a> | <a href="#allowable-search-terms">Allowable search terms</a> | <a href="#synonyms">Free text vs. controlled vocabulary</a> | <a href="#unique-identifiers">Unique identifiers</a> | <a href="#accession-prefixes">NCBI accession prefixes</a><br />
<a href="#isolates-browser-basic-search"><b>Basic search</b></a> | <a href="#isolates-browser-query-tips">Query tips</a> | <a href="#query-tips-multiple-terms">Multiple search terms</a> | <a href="#query-tips-special-characters">Special characters</a>| <a href="#query-tips-phrase-search-quotes">Phrase searches</a> | <a href="#query-tips-advanced-search">Advanced searches</a> | <a href="#query-tips-case-sensitive-vs-case-insensitive">Case sensitive vs. case insensitive searches</a><br />
<a href="#filters"><b>Filters</b> to refine search</a> | <a href="#filters-menu">Filters menu options</a> | <a href="#filters-on-the-fly">Filters are generated on the fly</a>| <a href="#filters-synonyms">Look for synonyms within a filter</a><br />
<a href="#isolates-browser-advanced-search"><b>Advanced search</b></a> | <a href="#solr">SOLR query language</a> | <a href="#solr-query-terms">Query Terms</a> | <a href="#operators">Operators</a> | <a href="#parentheses">Parentheses</a> | <a href="#isolates-browser-data-fields"><b>Data Fields</b></a> | <a href="#solr-sample-searches"><span style="color:#d70000">Examples of SOLR queries</span></a><br />
<a href="#isolates-browser-output"><b>Output</b></a> | <a href="#isolates-browser-output-table">Tabular list of isolates</a> | <a href="#isolates-browser-output-filters">Filters to refine results</a> | <a href="#sort-order">Sort order</a> | <a href="#isolates-browser-display-options">Customize the display</a> (<a href="#isolates-browser-display-options">choose columns</a>, <a href="#columns-default">default columns</a>, <a href="#columns-additional">additional columns</a>) | <a href="#isolates-browser-output-tree-viewer-link">SNP Tree Viewer link for each isolate that belongs to a SNP cluster</a> | <a href="#isolates-browser-share">"<b>Share</b>" function in the Isolates Browser</a> | <a href="#isolates-browser-illustration"><span style="color:#d70000">Illustrated example</span> of Isolates Browser search results</a><br />
<a href="#automated-searches-save">"<b>Save</b>" function to receive automatic e-mail notifications about new data that match your saved search</a><br />
<a href="#automated-searches-save-illustration"><span style="color:#d70000">Illustrated example</span> of an automatic notification for a saved search</a><br />
</div -->
<ul>
<li><a href="#isolates-browser-what-is">What is the Isolates Browser?</a></li>
<li id="toc-isolates-browser-input"><a href="#isolates-browser-input"><b>Input to Isolates Browser</b></a>
<ul>
<li><a href="#allowable-search-terms">Allowable search terms</a>
<ul>
<li><a href="#synonyms">Free text vs. controlled vocabulary</a></li>
<li><a href="#unique-identifiers">Unique identifiers</a> such as <a href="#ncbi-unique-identifiers">NCBI accessions</a>
<!-- ul>
<li><a href="#accession-prefix-gca">GCA_</a></li>
<li><a href="#accession-prefix-gcf">GCF_</a></li>
<li><a href="#accession-prefix-pdg">PDG</a></li>
<li><a href="#accession-prefix-pds">PDS</a></li>
<li><a href="#accession-prefix-pdt">PDT</a></li>
<li><a href="#accession-prefix-prj">PRJ</a></li>
<li><a href="#accession-prefix-samn">SAMN</a></li>
<li><a href="#accession-prefix-srr">SRR</a></li>
<li><a href="#accession-prefix-srs">SRS</a></li>
</ul -->
</li>
</ul>
</li>
<li id="toc-basic-search"><a href="#isolates-browser-basic-search">Basic Search</a>
<ul>
<li><a href="#isolates-browser-query-tips">Query tips</a>
<ul>
<!-- li><a href="#query-tips-multiple-terms">Multiple search terms</a></li>
<li><a href="#query-tips-special-characters">Special characters</a></li>
<li><a href="#query-tips-phrase-search-quotes">Phrase searches</a></li>
<li><a href="#query-tips-advanced-search">Advanced searches</a></li -->
<li><a href="#query-tips-case-sensitive-vs-case-insensitive">Case sensitive vs. case insensitive searches</a></li>
</ul>
</li>
<li><a href="#filters"><b>Filters</b> to refine search</a>
<ul>
<li><a href="#filters-menu">Filters menu options</a>
</li>
<li><a href="#filters-on-the-fly">Filters are generated on the fly</a></li>
<li><a href="#filters-gene-fields">Filters for gene fields</a></li>
<li><a href="#filters-scientific-name">Filter for Scientific name</a></li>
<li><a href="#filters-synonyms">Look for synonyms within a filter</a></li>
</ul>
</li>
</ul>
</li>
<li id="toc-advanced-search"><a href="#isolates-browser-advanced-search">Advanced Search</a>: <a href="#solr"><span style="color:#d70000"><b>SOLR Query Language</b></span></a>
<ul>
<li><a href="#solr-query-terms"><b>Query terms</b></a>
<ul>
<li><a href="#solr-single-term">Single term</a></li>
<li><a href="#solr-multiple-terms">Multiple terms</a></li>
<li><a href="#solr-phrase">Phrase</a></li>
<li><a href="#solr-term-modifiers">Term modifiers</a></li>
<li><a href="#wildcards">Wildcard searches</a></li>
<li><a href="#special-characters">Special characters in search terms</a></li>
</ul>
</li>
<li><a href="#operators"><b>Operators</b></a>
<ul>
<li><a href="#operators-boolean">AND, OR, NOT</a></li>
<li><a href="#operators-plus-and-minus">Plus (+) and Minus (-) symbols</a></li>
<li><a href="#range-searches">Range searches [nnnn TO nnnn]</a></li>
</ul>
</li>
<li><a href="#parentheses"><b>Parentheses</b></a>
<ul>
<li><a href="#parentheses-boolean">Use to order Boolean queries</a></li>
<li><a href="#parentheses-list-of-terms">Use to input a list of query terms</a></li>
<li><a href="#parentheses-in-gene-name">Are automatically escaped if they are an internal part of a gene name or query term</a></li>
</ul>
</li>
<li id="toc-data-fields"><a href="#isolates-browser-data-fields"><b>Data fields</b></a>
<ul>
<li><a href="#isolates-browser-data-field-AMRGenotypes">AMR Genotypes (AMR_genotypes)</a></li>
<li><a href="#isolates-browser-data-field-AMRGenotypesCore">AMR Genotypes core (AMR_genotypes_core)</a></li>
<li><a href="#isolates-browser-data-field-ASTPhenotypes">AST Phenotypes (AST_phenotypes)</a></li>
<li><a href="#isolates-browser-data-field-CollectionDate">Collection Date (collection_date)</a></li>
<li><a href="#isolates-browser-data-field-CreateDate">Create Date (creation_date)</a></li>
<li><a href="#isolates-browser-data-field-FoodOrigin">Food origin (food_origin)</a></li>
<li><a href="#isolates-browser-data-field-IsolationSource">Isolation Source (isolation_source)</a></li>
<li><a href="#isolates-browser-data-field-IsolationType">Isolation type (epi_type)</a></li>
<li><a href="#isolates-browser-data-field-Location">Location (geo_loc_name)</a></li>
<li><a href="#isolates-browser-data-field-MinSame">Minimum SNP distance within same isolation source type (minsame)</a></li>
<li><a href="#isolates-browser-data-field-MinDiff">Minimum SNP distance across different isolation source types (mindiff)</a></li>
<li><a href="#isolates-browser-data-field-OrganismGroup">Organism Group (taxgroup_name)</a></li>
<li><a href="#isolates-browser-data-field-Strain">Strain (strain)</a></li>
<li><a href="#isolates-browser-data-field-Serovar">Serovar (serovar)</a></li>
<li><a href="#isolates-browser-data-fields-list">see a list of all Isolates Browser data fields...</a></li>
</ul>
</li>
<!-- FULL LIST OF DATA FIELDS -->
<!-- ul>
<li><a href="#isolates-browser-data-field-AMRGenotypes">AMR genotypes (<b><i>AMR_genotypes</i></b>)</a><br />
<a href="#isolates-browser-data-field-Assembly">Assembly (<b><i>asm_acc</i></b>)</a><br />
<a href="#isolates-browser-data-field-ASTPhenotypes">AST phenotypes (<b><i>AST_phenotypes</i></b>)</a><br />
<a href="#isolates-browser-data-field-BioProject">BioProject (<b><i>bioproject_acc</i></b>)</a><br />
<a href="#isolates-browser-data-field-BioSample">BioSample (<b><i>biosample_acc</i></b>)</a><br />
<a href="#isolates-browser-data-field-CollectedBy">Collected by (<b><i>collected_by</i></b>)</a><br />
<a href="#isolates-browser-data-field-CollectionDate">Collection Date (<b><i>collection_date</i></b>)</a><br />
<a href="#isolates-browser-data-field-Contigs">Contigs (<b><i>asm_stats_n_contig</i></b>)</a><br />
<a href="#isolates-browser-data-field-CreateDate">Create Date (<b><i>creation_date</i></b>)</a><br />
<a href="#isolates-browser-data-field-Host">Host (<b><i>host</i></b>)</a><br />
<a href="#isolates-browser-data-field-HostDisease">Host Disease (<b><i>host_disease</i></b>)</a><br />
<a href="#isolates-browser-data-field-FoodOrigin">Food origin(<b><i>food_origin</i></b>)</a><br />
<a href="#isolates-browser-data-field-IFSAC_category">IFSAC_category (<b><i>IFSAC_category</i></b>)</a><br />
<a href="#isolates-browser-data-field-Isolate">Isolate (<b><i>target_acc</i></b>)</a><br />
<a href="#isolates-browser-data-field-IsolationSource">Isolation Source (<b><i>isolation_source</i></b>)</a><br />
<a href="#isolates-browser-data-field-IsolationType">Isolation type (<b><i>epi_type</i></b>)</a><br />
<a href="#isolates-browser-data-field-KmerGroup">K-mer group (<b><i>kmer_group</i></b>)</a><br />
<a href="#isolates-browser-data-field-LatLon">Lat/Lon (<b><i>lat_lon</i></b>)</a><br />
<a href="#isolates-browser-data-field-Length">Length (<b><i>asm_stats_length_bp</i></b>)</a><br />
<a href="#isolates-browser-data-field-Level">Level (<b><i>asm_level</i></b>)</a><br />
<a href="#isolates-browser-data-field-LibraryLayout">Library Layout (<b><i>LibraryLayout</i></b>)</a><br />
<a href="#isolates-browser-data-field-Location">Location (<b><i>geo_loc_name</i></b>)</a><br />
<a href="#isolates-browser-data-field-Method">Method (<b><i>assembly_method</i></b>)</a><br />
<a href="#isolates-browser-data-field-MinSame">Min-same (<b><i>minsame</i></b>)</a><br />
<a href="#isolates-browser-data-field-MinDiff">Min-diff (<b><i>mindiff</i></b>)</a><br />
<a href="#isolates-browser-data-field-N50">N50 (<b><i>asm_stats_contig_n50</i></b>)</a><br />
<a href="#isolates-browser-data-field-OrganismGroup">Organism Group (<b><i>taxgroup_name</i></b>)</a><br />
<a href="#isolates-browser-data-field-Outbreak">Outbreak (<b><i>outbreak</i></b>)</a><br />
[<a href="#isolates-browser-data-field-ParentGroup">Parent group (<b><i>parent_group</i></b>)</a><br />]
<a href="#isolates-browser-data-field-PFGEPrimaryEnzymePattern">PFGE Primary Enzyme Pattern (<b><i>PFGE_PrimaryEnzyme_pattern</i></b>)</a><br />
<a href="#isolates-browser-data-field-PFGESecondaryEnzymePattern">PFGE Secondary Enzyme Pattern (<b><i>PFGE_SecondaryEnzyme_pattern</i></b>)</a><br />
<a href="#isolates-browser-data-field-Platform">Platform (<b><i>Platform</i></b>)</a><br />
<a href="#isolates-browser-data-field-Run">Run (<b><i>Run</i></b>)</a><br />
<a href="#isolates-browser-data-field-Strain">Strain (<b><i>strain</i></b>)</a><br />
<a href="#isolates-browser-data-field-Serovar">Serovar (<b><i>serovar</i></b>)</a><br />
[<a href="#isolates-browser-data-field-Serotype">Serotype (<b><i>serotype</i></b>)</a>]<br />
<a href="#isolates-browser-data-field-SNPCluster">SNP cluster (<b><i>erd_group</i></b>)</a><br />
<a href="#isolates-browser-data-field-ScientificName">Scientific name (<b><i>scientific_name</i></b>)</a><br />
<a href="#isolates-browser-data-field-source_type">Source type (<b><i>source_type</i></b>)</a><br />
<a href="#isolates-browser-data-field-SpeciesTaxID">Species TaxID (<b><i>species_taxid</i></b>)</a><br />
<a href="#isolates-browser-data-field-SRACenter">SRA Center (<b><i>sra_center</i></b>)</a><br />
<a href="#isolates-browser-data-field-SRAReleaseDate">SRA Release Date (<b><i>sra_release_date</i></b>)</a><br />
[<a href="#isolates-browser-data-field-Status">Status (<b><i>status</i></b>)</a><br />]
<a href="#isolates-browser-data-field-TaxID">TaxID (<b><i>taxid</i></b>)</a><br />
[<a href="#tree_node_ids">tree_node_ids (<b><i>tree_node_ids</i></b>)</a><br />]
<a href="#isolates-browser-data-field-WGSAccession">WGS Accession (<b><i>wgs_master_acc</i></b>)</a><br />
<a href="#isolates-browser-data-field-WGSPrefix">WGS Prefix (<b><i>wgs_acc_prefix</i></b>)</a><br />
</li>
</ul -->
<!-- END FULL LIST OF DATA FIELDS -->
<li id="toc-search-modifiers"><a href="#isolates-browser-search-modifiers"><b>Search modifiers</b></a>
<ul>
<li><a href="#isolates-browser-search-modifier-new"><b>new</b></a></li>
<br />
</ul>
</li>
<li id="toc-solr-sample-searches"><a href="#solr-sample-searches"><span style="color:#d70000">Examples of SOLR queries</span></a>
<ul>
<li><a href="#solr-sample-search-IsolationSourceAllPurposeFlour"><b>Isolation source:</b><br />
Show all isolates that have the exact phrase "All-Purpose Flour" in the isolation_source data field</a></li>
<li><a href="#solr-sample-search-LocationAndOrganismGroup"><b>Geographic location and organism group:</b><br />
Show all Salmonella isolates collected in USA</a></li>
<li><a href="#solr-sample-search-GenotypesMcrAndBlakpc"><b>Genotypes: isolates that have specific genes:</b><br />
Show all of the isolates that have a mobile colistin resistance gene and a KPC beta-lactamase</a></li>
<li><a href="#solr-sample-search-PhenotypesCiproResistant"><b>Phenotypes: isolates that are resistant to a given antibiotic:</b><br />
Show all of the isolates that are resistant to ciprofloxacin</a></li>
<li><a href="#solr-sample-search-GenotypesAndPhenotypes"><b>Genotypes and phenotypes:</b></a><br />
<a href="#solr-sample-search-GenotypesNoBlakpcNoBlandmImipenemResistant"><b>Example 1: missing specific genes, resistant to antibiotic:</b><br />
Show all of the isolates that lack both a blaKPC and blaNDM carbapenemase but are resistant to imipenem</a><br />
<a href="#solr-sample-search-GenotypesBlakpcMeropenemSusceptible"><b>Example 2: has specific gene, susceptible to antibiotic:</b><br />
Show all of the isolates that have a blaKPC gene and are susceptible to meropenem</a><br />
<a href="#solr-sample-search-GenotypesQnrCiproResistant"><b>Example 3: has specific gene, resistant to either of two antibiotics:</b><br />Show all of the isolates that have a qnr gene and that are resistant to either ciprofloxacin or nalidixic acid</a>
</li>
<!-- li><a href="#solr-sample-search-GeneNameSpecialCharacters"><b>Genotypes: gene name with special characters:</b><br />
Show all of the isolates that have the gene aph(4)-Ia and a blaKPC carbapenemase</a></li -->
<li><a href="#solr-sample-search-WhereIsMyIsolate"><b>Where is my isolate?</b><br />
Retrieve your data by BioSample accession numbers or SRA Run accession numbers</a></li>
<li><a href="#solr-sample-search-BatchSearch"><b>Batch search with isolate identifiers that contain a hyphen:</b><br />
Input a list of isolate identifiers that contain special characters (e.g., hyphens)</a></li>
</ul>
</li>
</ul>
</li>
</ul>
</li>
<li id="toc-isolates-browser-output"><a href="#isolates-browser-output"><b>Output from Isolates Browser</b></a>
<ul>
<li><a href="/pathogens/docs/isolates_gcp">Search/retrieve isolates browser data in Google Cloud BigQuery</a></li>
<li><a href="#isolates-browser-output-table">Tabular list of isolates</a></li>
<li><a href="#isolates-browser-exceptions-table">Exceptions table</a></li>
<li><a href="#isolates-browser-matched-clusters">Matched clusters</a></li>
<li><a href="#isolates-browser-output-filters">Filters to refine results</a></li>
<li><a href="#sort-order">Sort order</a>
<ul>
<li><a href="#sort-order-lifo">Default sort order</a></li>
<li><a href="#sort-order-column-headers">Sort by column headers</a></li>
</ul>
</li>
<li id="toc-isolates-browser-display-options"><a href="#isolates-browser-display-options">Customize the Isolates Browser display</a>
</li>
<li><a href="#isolates-browser-output-tree-viewer-link">SNP Tree Viewer link for each isolate that belongs to a SNP cluster</a></li>
<li><a href="#isolates-browser-share">"<b>Share</b>" function in the Isolates Browser</a></li>
<li><a href="#isolates-browser-illustration"><span style="color:#d70000">Illustrated example</span> of Isolates Browser search results</a></li>
<li><a href="#automated-searches-save">"<b>Save</b>" function to receive automatic e-mail notifications about new data from a saved search</a>
<ul>
<li><a href="#automated-searches-save-illustration"><span style="color:#d70000">Illustrated example</span> of an automatic notification for a saved search</a></li>
</ul>
</li>
<li><a href="#isolates-browser-display-in-microbigge">Display isolates in MicroBIGG-E using Cross-browser selection</a></li>
<li><a href="#isolates-browser-download">Download data from the Isolates Browser web display</a>
<ul>
<li><a href="#isolates-browser-download-metadata">Metadata</a></li>
<li><a href="#isolates-browser-download-assemblies">Assemblies</a></li>
</ul>
</li>
</ul>
</li>
</ul>
<!-- ========= ISOLATES_BROWSER_WHAT_IS ============ -->
<h3 id="isolates-browser-what-is">What is the Isolates Browser? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The NCBI Pathogen Detection <a href="/pathogens/isolates#/search/">Isolates Browser</a> is a web-based portal that provides analysis results for the two fundamental components of the Pathogen Detection Project: 1) pathogen isolate similarity and 2) antimicrobial resistance. The results are presented in tabular format with the full unfiltered results set presented as default, as opposed to summary documents appearing only after a search is completed as in other NCBI resources. You can query the Browser by entering various text strings, as described under "<a href="#allowable-search-terms">Allowable search terms</a>."<br /><br />
Upon opening the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, a table displays <b>data for all available isolates</b>, with the most recently added data at the top. The data can be <b>faceted</b> by using <a href="#filters">filters</a> (e.g., Property: has antimicrobial resistance (AMR) genotypes), <a href="#isolates-browser-input"><b>queried</b></a> with a wide variety of <a href="#allowable-search-terms">allowable search terms</a>, using either <a href="#isolates-browser-basic-search">basic</a> or <a href="#isolates-browser-advanced-search">advanced</a> search methods, and <b>sorted</b> by clicking on column headers.<br /><br />
<b>Every row</b> in the Isolates Browser is an <b>assembled isolate</b>, possibly with antimicrobial resistance (AMR), virulence, and/or stress response <a href="#data-type-genotype"><b>genotype data</b></a>, and antibiotic susceptibility (AST) <a href="#data-type-phenotype"><b>phenotype data</b></a>, as available.<br /><br />
The table summarizes and links to the data available for each pathogen, such as strain name, geographic origin, isolation type (environmental or clinical), BioSample UID, organism group (PDG* accession), antimicrobial resistance (AMR)/virulence/stress response genotypes, and antibiotic susceptibility (AST) phenotypes, and more (see list of <a href="#isolates-browser-data-fields">data fields</a> available in the Isolates Browser).<br /><br />
If an isolate has a "PDS*" accession number in the <b>"SNP Cluster" column</b>, that indicates it is part of a SNP cluster, and you can click on the PDS* accession to launch the <a href="#snp-tree-viewer"><b>SNP Tree Viewer</b></a> and examine the relationships among your isolate of interest and other similar isolates.<br /><br />
The information below provides details on how the <a href="/pathogens/isolates#/search/">Isolates Browser</a> can be used, including allowable <a href="#isolates-browser-input"><b>input</b></a>, a description of the <a href="#isolates-browser-output"><b>output</b></a>, and an <a href="#isolates-browser-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>. The browser accepts <a href="#isolates-browser-basic-search"><b>basic queries</b></a> that contain one or more text terms, with or without quotes. It also accepts <a href="#solr"><b>advanced queries</b> using the <b>SOLR query language</b></a>, such as <a href="#operators">complex Boolean queries</a> that look for the search terms in specific <a href="#isolates-browser-data-fields"><b>data fields</b></a>. <a href="#filters"><b>Filters</b></a> on the results page enable you to further narrow your retrieval, if desired, and links from the Isolates Browser to the <a href="#snp-tree-viewer"><b>SNP Tree Viewer</b></a> enable you to interactively explore the relationship of an isolate of interest to other isolates in the SNP cluster, which were found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to have closely related genome sequences.<br />
</div>
<!-- ======== END_ISOLATES_BROWSER_WHAT_IS ========= -->
<!-- ========= ISOLATES_BROWSER_INPUT ============ -->
<h3 id="isolates-browser-input">Input for Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#allowable-search-terms"><b>Allowable search terms</b></a> | <a href="#synonyms">Free text vs. controlled vocabulary</a> | <a href="#unique-identifiers">Unique identifiers</a> | <a href="#accession-prefixes">NCBI accession prefixes</a><br />
<a href="#isolates-browser-basic-search"><b>Basic search</b></a> |
<a href="#isolates-browser-query-tips"><b>Query tips</b></a> | <a href="#query-tips-multiple-terms">multiple terms</a> | <a href="#query-tips-special-characters">special characters</a> | <a href="#query-tips-phrase-search-quotes">phrase searches</a> | <a href="#query-tips-advanced-search">advanced searches</a> | <a href="#case-sensitive">case sensitive vs. case insensitive searches</a><br />
<a href="#filters"><b>Filters</b> to refine search</a> | <a href="#filters-menu">filters menu options</a> | <a href="#filters-on-the-fly">filters are generated on the fly</a> | <a href="#filters-synonyms">look for synonyms within a filter</a><br />
<a href="#isolates-browser-advanced-search"><b>Advanced search</b></a> |
<a href="#solr"><span style="color:#d70000">SOLR query language</span></a> | <a href="#solr-query-terms">Query terms</a> | <a href="#operators">Operators</a> | <a href="#parentheses">Parentheses</a> | <a href="#isolates-browser-data-fields"><b>Data fields</b></a> | <a href="#solr-sample-searches"><span style="color:#d70000">Examples of SOLR queries</span></a>
</div>
<!-- =========== ISOLATES_BROWSER_ALLOWABLE_SEARCH_TERMS ========== -->
<div style="padding-left: 2em">
<h4 id="allowable-search-terms">Allowable search terms <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The <a href="/pathogens/isolates#/search/">Isolates Browser</a> accepts a variety of text strings as input. For example, the browser can retrieve isolates that contain terms such as <a href="/pathogens/isolates#/search/lettuce">lettuce</a> or <a href="/pathogens/isolates#/search/romaine">romaine</a> or <a href="/pathogens/isolates#/search/strawberry">strawberry</a> or <a href="/pathogens/isolates#/search/strawberries">strawberries</a> or <a href="/pathogens/isolates#/search/%22all-purpose%20flour%22">"all-purpose flour"</a>. You can also search for many other types of text strings, such as <a href="#isolates-browser-data-field-OrganismGroup">organism group</a>, <a href="#isolates-browser-data-field-AMRGenotypes">antimicrobial resistance (AMR) genotype</a>, <a href="#isolates-browser-data-field-ASTPhenotypes">Antimicrobial Susceptibility Test (AST) phenotype</a>, and more. The <a href="#isolates-browser-data-fields"><b>data fields</b></a> section of this document lists the many types of strings that can be searched, and provides example searches for the various data fields.</li>
</ul>
</div>
<!-- ========= END_ISOLATES_BROWSER_ALLOWABLE_SEARCH_TERMS ======== -->
<!-- ====== ISOLATES_BROWSER_FREE_TEXT_VS_CONTROLLED_VOCABULARY ====== -->
<div style="padding-left: 2em">
<h4 id="synonyms">Free text vs. controlled vocabulary <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li id="free-text"><b>Free Text</b> - Many data fields in the <a href="/pathogens/isolates#/search/">Isolates Browser</a> are free text and therefore contain the exact terms that were supplied by the data submitters.</li>
<ul>
<li>Please note that <b>data submitters might use different forms of a term</b> in their submissions.</li>
<li>For example, some submitters might use <b>hyphens</b> between terms (e.g., "all-purpose flour") while others might use <b>spaces</b> (e.g., "all purpose flour").</li>
<li>For a <b>comprehensive</b> search, include <b>synonyms</b> in your query, or use <a href="#wildcards">wildcards</a> to search for a word stem.</li>
<li>For a more <b>precise</b> search, you can limit your query to a specific <a href="#isolates-browser-data-fields"><b>data field</b></a>, such as <a href="#isolates-browser-data-field-IsolationSource">Isolation source</a>. Please note that, in field-specified queries, both the <b>data field names</b> and <b>values</b> are <a href="#case-sensitive"><b>case sensitive</b></a>.</li>
<li>Separate sections of this document provide query tips about <a href="#synonyms">searching for synonyms</a>, and describe how the Isolates Browser handles <a href="#special-characters">special characters</a> in search terms (such as <b>hyphens</b> in <a href="#isolates-browser-data-field-Strain">strain</a> names, <b>parentheses</b> in <a href="#isolates-browser-data-field-AMRGenotypes">gene names</a>, slashes in <a href="#isolates-browser-data-field-Serovar">serovar</a> names, etc.).</li>
</ul>
<br />
<!-- ul>
<li>Examples of free text data fields include: _________, _________, _________, _________.</li>
</ul>
<br -->
<li id="controlled-vocabulary"><b>Controlled Vocabulary</b> - Some data fields in the <a href="/pathogens/isolates#/search/">Isolates Browser</a> contain a controlled vocabulary. In these fields, it is not necessary to search for synonyms.</li> <br />
<ul>
<li>For example, the <a href="#isolates-browser-data-field-Location">Location</a> data field, which lists the geographic location where the sample was isolated, contains two parts: <i>Country</i> and <i>Region</i>. <i>Country</i> is a controlled vocabulary (<a href="https://www.ncbi.nlm.nih.gov/genbank/collab/country">https://www.ncbi.nlm.nih.gov/genbank/collab/country</a>). <i>Region</i> is not controlled and can be anything (i.e., free text, such as a state abbreviation, province name, city name, zip code, etc.).</li>
<!-- li>Additional examples of controlled vocabulary data fields include: ________, _________, _________, _________.</li>
<li>The <a href="#isolates-browser-data-fields"><b>data fields</b></a> section of this document indicates whether each field contains controlled vocabulary, free text, or a combination of both.</li -->
</ul>
</ul>
</div>
<!-- ====== END_ISOLATES_BROWSER_FREE_TEXT_VS_CONTROLLED_VOCABULARY ===== -->
<!-- ====== ISOLATES_BROWSER_UNIQUE_IDENTIFIERS_AND_ACCESSION_PREFIXES ====== -->
<div style="padding-left: 2em">
<h4 id="unique-identifiers">Unique identifiers and NCBI accession prefixes<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li id="ncbi-unique-identifiers"><b>NCBI Unique identifiers</b>, such as NCBI accessions (e.g., biosample ID <a href="/pathogens/isolates#/search/SAMN05245394">SAMN05245394</a>, bioproject ID <a href="/pathogens/isolates#/search/PRJNA230969">PRJNA230969</a>, etc.), can be used to retrieve pathogen isolates.<br /><br />
Note that while NCBI accessions are unique, there can be multiplicity involved and it is possible for the same accession to appear in multiple current Pathogen records. For example, two or more isolates can belong to the same BioProject and/or same SNP cluster, so the record for each isolate will have its own PDT accession, but all of those records will contain the same PRJ and/or PDS accession.</li>
<li id="accession-prefixes">Some <b>NCBI accessions</b> that can be searched in the Pathogen Detection Project have the following prefixes:<br />
<a href="#accession-prefix-gca">GCA</a> | <a href="#accession-prefix-gcf">GCF</a> | <a href="#accession-prefix-ng">NG</a> | <a href="#accession-prefix-pdg">PDG</a> | <a href="#accession-prefix-pds">PDS</a> | <a href="#accession-prefix-pdt">PDT</a> | <a href="#accession-prefix-prj">PRJ</a> | <a href="#accession-prefix-samn">SAMN</a> | <a href="#accession-prefix-srr">SRR</a> | <a href="#accession-prefix-srs">SRS</a> | <a href="#accession-prefix-wp">WP</a><br />
<ul>
<li id="accession-prefix-gca"><b>GCA_</b> - Accession number prefix for a <b>GenBank genome assembly</b>. This is data submitted by the scientific community directly to GenBank as an assembled genome.<br />
<i>(Read more about <a href="#data-type-genome">genomes</a> in the <a href="#data-types">data types</a> section of this document.)</i></li>
<li id="accession-prefix-gcf"><b>GCF_</b> - Accession number prefix for a <b>RefSeq genome assembly</b>. This is a representative genome assembly for a given organism in <a href="https://www.ncbi.nlm.nih.gov/refseq/">RefSeq</a>, a non-redundant database. <br />
<i>(Read more about <a href="https://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/">Prokaryotic RefSeq Genomes</a>.)</i><br />
<i>(Read more about <a href="https://www.ncbi.nlm.nih.gov/assembly/model/">NCBI Genome Assembly Models</a>.)</i>
</li>
<li id="accession-prefix-ng"><b>NG_</b> - Accession number prefix for a <b>RefSeq genomic sequence record</b>.<br />
<i>(Read more about <a href="https://www.ncbi.nlm.nih.gov/books/NBK50679/#RefSeqFAQ.what_is_an_ng_accession_and_wh">NG_* accessions</a>.)</i>
</li>
<li id="accession-prefix-pdg"><b>PDG</b> - Accession number prefix for a <b>P</b>athogen <b>D</b>etection Organism <b>G</b>roup.<br />
<i>Technical note: An organism group (PDG) contains one or more targets (PDTs). A PDT is a member of zero or one SNP cluster (PDS), and never more than one cluster. A SNP cluster is composed of two or more PDTs, and each PDS is completely contained within a PDG.</i> Each of these objects is versioned. A version change in a PDG accession implies a membership change in the organism group (isolates added or subtracted). A version change in a PDS accession implies membership change in the cluster. A version change in PDT implies a new assembly that may differ from the previous assembly.<br />
<i>(Read more about <a href="#isolates-browser-data-field-OrganismGroup">organism groups</a> in the <a href="#isolates-browser-data-fields">data fields</a> section of this document.)</i></li>
<li id="accession-prefix-pds"><b>PDS</b> - Accession number prefix for a <b>P</b>athogen <b>D</b>etection <b>SNP</b> Cluster.<br />
<i>(Read more about <a href="#isolates-browser-data-field-SNPCluster">SNP clusters</a> in the <a href="#isolates-browser-data-fields">data fields</a> section of this document.)</i></li>
<li id="accession-prefix-pdt"><b>PDT</b> - Accession number prefix for a <b>P</b>athogen <b>D</b>etection <b>T</b>arget. This is the Pathogen project accession for an individual isolate's genome assembly.<br />
<i>(Read more about <a href="#data-type-genome">genome assemblies</a> in the <a href="#data-types">data types</a> section of this document.)</i></li>
<li id="accession-prefix-prj"><b>PRJ</b> - Accession number prefix for an International Nucleotide Sequence Database Collaboration (<a href="http://www.insdc.org/">INSDC</a>) <b>BioProject</b>.<br />
<i>(Read more about <a href="#data-type-bioproject">bioprojects</a> in the <a href="#data-types">data types</a> section of this document.)</i></li>
<li id="accession-prefix-samn"><b>SAMN, SAME, SAMD</b> - Accession number prefix for an INSDC <b>BioSample</b> record.<br />
(<a href="https://www.ebi.ac.uk/">EBI</a> BioSamples have the prefix SAMEA, and <a href="https://www.ddbj.nig.ac.jp/index-e.html">DDBJ</a> BioSamples have the prefix SAMD.)<br />
<i>(Read more about <a href="#data-type-biosample">biosamples</a> in the <a href="#data-types">data types</a> section of this document.)</i></li>
<li id="accession-prefix-srr"><b>SRR, ERR, DRR</b> - Accession number prefix for an INSDC <b>S</b>equence <b>R</b>ead Archive (SRA) <b>R</b>un. A Run is an object that contains actual <b>sequencing data</b> for a particular sequencing experiment. SRA experiments may contain many Runs depending on the number of sequencing instrument runs that were needed.<br />
<i>(Read more about <a href="https://www.ncbi.nlm.nih.gov/books/NBK56913/#search.what_do_the_different_sra_accessi">SRA accessions</a>.)</i></li>
<li id="accession-prefix-srs"><b>SRS, ERS, DRS</b> - Legacy accession number prefix for an INSDC <b>S</b>equence <b>R</b>ead Archive (SRA) Experiment <b>S</b>ample. A Sample is an object that contains the <b>metadata</b> describing the physical sample upon which a sequencing experiment was performed. That information is imported from the BioSample record. This string is included in the list of <a href="#isolates-browser-data-field-Isolate_identifiers">isolate_identifiers</a>.<br />
<i>(Read more about <a href="https://www.ncbi.nlm.nih.gov/books/NBK56913/#search.what_do_the_different_sra_accessi">SRA accessions</a>.)</i></li>
<li id="accession-prefix-wp"><b>WP_</b> - Accession number prefix for a <b>RefSeq protein sequence</b> that has been found in one or more archaeal and bacterial RefSeq genomes. If the identical protein sequence has been found in multiple genomes, the <b>WP_ sequence record is a non-redundant representation</b> of all the instances of the protein, and includes links to the genomic sequences that code for the protein.<br />
<i>Details about <b>WP_* accessions</b></i> <i>are provided on the web pages that describe the <a href="https://www.ncbi.nlm.nih.gov/refseq/about/nonredundantproteins/">RefSeq non-redundant proteins</a>, the <a href="https://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/reannotation/">Prokaryotic RefSeq Genome Re-annotation Project</a>, and the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/announcements/WP-proteins-06.10.2013.pdf">New RefSeq protein product and data model</a>.</i>
</li>
</ul>
</li>
</ul>
</div>
<!-- =========== END_ISOLATES_BROWSER_UNIQUE_IDENTIFIERS_AND_ACCESSION_PREFIXES ========== -->
<!-- =========== ISOLATES_BROWSER_BASIC_SEARCH ========== -->
<div style="padding-left: 2em">
<h4 id="isolates-browser-basic-search">Basic Search <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">A basic search simply consists of <b>one or more <!-- a href="#IsolatesBrowserAllowableTerms" -->search terms<!-- /A --></b>, and <b>does not include</b> any Boolean operators, parentheses, or other criteria such as search field (<a href="#isolates-browser-data-fields">data field</a>) specifiers. Below is information about:<br /><br />
<a href="#isolates-browser-query-tips"><b>Query tips</b></a> | <a href="#query-tips-multiple-terms">multiple terms</a> | <a href="#query-tips-special-characters">special characters</a> | <a href="#query-tips-phrase-search-quotes">phrase searches</a> | <a href="#query-tips-advanced-search">advanced searches</a> | <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a><br />
<a href="#filters"><b>Filters to refine search</b></a> |
<a href="#filters-menu">filters menu options</a> | <a href="#filters-on-the-fly">filters are generated on the fly </a> | <a href="#filters-gene-fields">Filters for gene fields</a> | <a href="#filters-scientific-name">Filter for <em>Scientific name</em></a> | <a href="#filters-synonyms">look for synonyms within a filter</a>
</div>
<!-- =========== ISOLATES_BROWSER_QUERY_TIPS ========== -->
<ul>
<li id="isolates-browser-query-tips"><b>Query tips</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<a href="#query-tips-multiple-terms">multiple terms</a> | <a href="#query-tips-special-characters">special characters</a> | <a href="#query-tips-phrase-search-quotes">phrase searches</a> | <a href="#query-tips-advanced-search">advanced searches</a> | <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a><br /><br />
<ul>
<!-- ======== QUERY_TIPS:MULTIPLE_TERMS ========= -->
<li id="query-tips-multiple-terms"><b>Multiple search terms</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
If you enter <b>multiple search terms</b>, the system will automatically separate the terms with a <b>Boolean OR</b>, and will therefore retrieve isolates that have <b>at least one</b> of the terms in your query. Note that this is different from many other NCBI resources, which require explicit use of "OR" in the search. For isolates that have <b>more than one term</b> from your query, please note that the terms will not necessarily be adjacent to each other, and will not have to be present in the same <a href="#isolates-browser-data-fields">data field</a>. <i>(If desired, use <b><a href="#query-tips-phrase-search-quotes">quotes to force a phrase search</a></b>, and use an <a href="#query-tips-advanced-search">advanced search</a> to limit searches to a specific data field.)</i><br /><br />
<div style="padding-left: 2em">
For example, try a search for the following query (with no quotes and no special characters):<br />
<a href="/pathogens/isolates#/search/all%20purpose%20flour"><b><i>all purpose flour</i></b></a><br />
The search system <b>interprets the query as</b> three separate terms:<br />
<b><i>all OR purpose OR flour</i></b><br />
It therefore retrieves isolates whose records contain the term "all" in any data field, or the term "purpose" in any data field, or the term "flour" in any data field.
</div>
<br />
</li>
<!-- ======== END_QUERY_TIPS:MULTIPLE_TERMS ========= -->
<!-- ======== QUERY_TIPS:SPECIAL_CHARACTERS ========= -->
<li id="query-tips-special-characters"><b>Special characters</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
If a search term contains <a href="#special-characters"><b>special characters</b></a> (such as <b>hyphens</b> in <a href="#isolates-browser-data-field-Strain">strain</a> names, <b>parentheses</b> in <a href="#isolates-browser-data-field-AMRGenotypes">gene names</a>, slashes in <a href="#isolates-browser-data-field-Serovar">serovar</a> names, etc.), the system recognizes the special characters as part of the search term, and only retrieves isolates that include the term exactly as it was entered.<br /><br />
<div style="padding-left: 2em">
For example, try a search for the following query (with no quotes but with a hyphen):<br />
<a href="/pathogens/isolates#/search/all-purpose%20flour"><b><i>all-purpose flour</i></b></a><br />
The search system treats the hyphen as part of the search term and <b>interprets the query as</b> two separate terms:<br />
<b><i>all-purpose OR flour</i></b><br />
It therefore retrieves isolates whose records contain the hyphenated term "<i>all-purpose</i>" in any data field, or the term "<i>flour</i>" in any data field.<br /><br />
A separate section of this document provides <a href="#special-characters">additional information about special characters</a>.
</div>
<br />
</li>
<!-- ======== QUERY_TIPS:SPECIAL_CHARACTERS ========= -->
<!-- ======== QUERY_TIPS:PHRASE_SEARCH ========= -->
<li id="query-tips-phrase-search-quotes"><b>Phrase searches using quotes</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Use <b>quotes</b> around a set of words if you want to search all of the words together as a <b>phrase</b>. That will retrieve isolates which have the terms adjacent to each other, and the phrase can occur in any data field of the record. <i>(If desired, use an <a href="#QueryTipsAdvancedSearch">advanced search</a> to limit searches to a specific <a href="#isolates-browser-data-fields">data field</a>.)</i><br /><br />
<div style="padding-left: 2em">
For example, try a search, with a hyphen and with quotes, for:<br />
<a href="/pathogens/isolates#/search/%22all-purpose%20flour%22"><b><i>"all-purpose flour"</i></b></a>.<br />
The quotes require the search system to <b>interpret the query as</b> the complete phrase:<br />
<b><i>all-purpose flour</i></b><br />
It therefore only retrieves isolates whose records contain that exact character string.<br /><br />
If no quotes are used, the system will automatically insert a Boolean OR when it encounters a space in the query string. In the example above, if the quotes were absent, the system would interpret the search as <i>all-purpose OR flour</i>. The hyphen would be retained because the search system recognizes <a href="#special-characters">special characters</a> as part of the search term.
</div>
<br />
</li>
<!-- ======== QUERY_TIPS:PHRASE_SEARCH ========= -->
<!-- ======== QUERY_TIPS:ADVANCED_SEARCHES ========= -->
<li id="query-tips-advanced-search"><b>Advanced searches</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Use an <a href="#isolates-browser-advanced-search">advanced search</a> strategy if you want to <b>exercise more control over the search</b>, such as specify the desired <a href="#operators">Boolean operators</a>; use <a href="#parentheses">parentheses</a> to specify a list of items or to determine the order of execution of the query; and/or limit your search to a specific <a href="#isolates-browser-data-fields">data field</a>. For queries that specify data fields, please note that both the <b>data field names</b> and <b>values</b> are <a href="#case-sensitive">case sensitive</a>.<br /><br />
Examples of advanced searches are available in a separate section of this document and include:<br />
<ul>
<li><a href="#solr-sample-search-IsolationSourceAllPurposeFlour"><b>Isolation source:</b><br />
Show all isolates that have the exact phrase "All-Purpose Flour" in the isolation_source data field</a></li>
<li><a href="#solr-sample-search-LocationAndOrganismGroup"><b>Geographic location and organism group:</b><br />
Show all Salmonella isolates collected in USA</a></li>
<li><a href="#solr-sample-search-GenotypesMcrAndBlakpc"><b>Genotypes: isolates that have specific genes:</b><br />
Show all of the isolates that have a mobile colistin resistance gene and a KPC beta-lactamase</a></li>
<li><a href="#solr-sample-search-GenotypesAndPhenotypes"><b>Genotypes and phenotypes:</b></a><br />
<a href="#solr-sample-search-GenotypesNoBlakpcNoBlandmImipenemResistant"><b>Example 1: missing specific genes, resistant to antibiotic:</b><br />
Show all of the isolates that lack both a blaKPC and blaNDM carbapenemase but are resistant to imipenem</a><br />
<a href="#solr-sample-search-GenotypesBlakpcMeropenemSusceptible"><b>Example 2: has specific gene, susceptible to antibiotic:</b><br />
Show all of the isolates that have a blaKPC gene and are susceptible to meropenem</a><br />
<a href="#solr-sample-search-GenotypesQnrCiproResistant"><b>Example 3: has specific gene, resistant to either of two antibiotics:</b><br />Show all of the isolates that have a qnr gene and that are resistant to either ciprofloxacin or nalidixic acid</a>
</li>
<!-- li><a href="#solr-sample-search-GeneNameSpecialCharacters"><b>Genotypes: gene name with special characters:</b><br />
Show all of the isolates that have the gene aph(4)-Ia and a blaKPC carbapenemase</a></li><br -->
<li><a href="#solr-sample-search-WhereIsMyIsolate"><b>Where is my isolate?</b><br />
Retrieve your data by BioSample accession numbers or SRA Run accession numbers</a></li>
<li><a href="#solr-sample-search-BatchSearch"><b>Batch search with isolate identifiers that contain a hyphen:</b><br />
Input a list of isolate identifiers that contain special characters (e.g., hyphens)</a></li>
</ul>
</li>
<!-- ======== QUERY_TIPS:ADVANCED_SEARCHES ========= -->
<!-- ====== QUERY_TIPS:CASE_SENSITIVE ===== -->
<li id="query-tips-case-sensitive-vs-case-insensitive">
<b><a href="#case-sensitive">Case sensitive</a> versus <a href="#case-insensitive">case insensitive</a> searches:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<span id="case-sensitive"><b>Case sensitive searches:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
If you want to do an <a href="#isolates-browser-advanced-search">advanced search</a> in order to query specific <a href="#isolates-browser-data-fields">data fields</a>, please note that the <b>names of <a href="#isolates-browser-data-fields">data fields</a></b>, and the <b>values they contain</b>, are <b>case sensitive</b>.<br /><br />
The values in the data fields represent text strings <b>exactly as they were entered by the submitter</b>, including upper case and lower case letters, <a href="#special-characters">special characters</a> such as hyphens, etc.<br /><br />
The case-sensitivity and the retention of special characters such as hyphens and parentheses (when they are internal to a search term) were built into the system in order to ensure <b>precise handling of searches</b> for values such as <b>strain name</b>, <b>serovar</b>, <b>gene symbol</b>, and more. The case sensitivity and handling of special characters applies to other data fields as well. <br /><br />
Therefore, <b>when you search a specific data field</b>, the system will retrieve isolates that contain the <b>exact string you have specified</b>, including upper case and lower case letters, as well as special characters such as hyphens and parentheses.<br /><br />
<div style="padding-left: 2em">
For example, search the Isolation Source data field for the phrase "All-Purpose Flour" by entering the following query:<br />
<a href="/pathogens/isolates#/search/isolation_source:%22All-Purpose%20Flour%22"><b><i>isolation_source:"All-Purpose Flour"</i></b></a><br />
The system will retrieve isolates that contain the exact string you have specified, including upper and lower case and the hyphen.
</div>
<br />
<span id="case-insensitive"><b>Case insensitive searches:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<b>If you are uncertain</b> about whether to use <b>upper case or lower case letters </b> in your query, then simply enter your search terms, regardless of case, <b>without a data field specifier</b>.<br /><br />
<div style="padding-left: 2em">
For example, any one of the following three queries will work equally well<!-- (although the results will be different if you omit the hyphen) -->:<br />
<a href="/pathogens/isolates#/search/%22all-purpose%20flour%22"><b><i>"all-purpose flour"</i></b></a><br />
-- or --<br />
<a href="/pathogens/isolates#/search/%22ALL-PURPOSE%20FLOUR%22"><b><i>"ALL-PURPOSE FLOUR"</i></b></a><br />
-- or --<br />
<a href="/pathogens/isolates#/search/%22All-Purpose%20Flour%22"><b><i>"All-Purpose Flour"</i></b></a><br />
</div>
<br />
Those queries work because, in the absence of a data field specifier, the system searches a <b>text index</b>, which is a <b>case insensitive compilation of terms</b> from many text-containing data fields. Such searches are less precise in their retrieval, because the query terms can appear in any text field of pathogen isolate records; however, they provide a flexible data retrieval mechanism.<br /><br />
<i>(Note: The <b>presence or absence of the hyphen</b> *will* affect the results, whether or not you specify a data field. This is because the hyphen is considered to be part of the search term and therefore must be present in the retrieved isolates. A separate section of this document provides additional information about <a href="#query-tips-special-characters">special characters</a>, as well as the use of <a href="#query-tips-phrase-search-quotes">quotes to force a phrase search</a>.)</i>
</li>
<!-- ====== END_QUERY_TIPS:CASE_SENSITIVE ===== -->
</ul>
</li>
</ul>
<!-- =========== END_ISOLATES_BROWSER_QUERY_TIPS ========== -->
</div>
<!-- =========== END_ISOLATES_BROWSER_BASIC_SEARCH ========== -->
<!-- =========== ISOLATES_BROWSER_FILTERS ========== -->
<div style="padding-left: 2em">
<h4 id="filters">Filters to refine search <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em"><a href="#filters-menu">Filters menu options</a> | <a href="#filters-on-the-fly">Filters are generated on the fly</a> | <a href="#filters-synonyms">Look for synonyms within a filter</a></div>
<ul>
<!-- ========= FILTERS_MENU_OPTIONS ========= -->
<li id="filters-menu">The <b>"Filters" menu options</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The "Filters" menu options in the <a href="/pathogens/isolates#/search/">Isolates Browser</a> enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a <a href="#isolates-browser-basic-search">basic search</a> or an <a href="#isolates-browser-advanced-search">advanced search</a>.<br /><br />The filter menu now allows all data fields in the column chooser to be filtered. Counts next to the filter values indicate the number of records that match that value. These counts can allow you to do counting analyses using only the filters interface.
By default, each filter displays the <b>top 100 terms</b> (based on the number of isolates retrieved by a term). Note that:
<ul>
<li>A <b>Boolean "OR"</b> is applied if multiple items are checked in the same filter field. This way you can choose multiple values in the same filter. For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, scroll to the "Isolation source" field, and check the boxes for "stool" and "feces". The system will retrieve isolates that have either one of those values in the "Isolation source" field.</li>
</ul>
</li>
<li>A <b>Boolean "AND"</b> is applied if you select items in several different filter fields (Location, Source, etc). For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, then check the boxes for "clinical" in the "Isolation type" filter and "wound" in the "Isolation source" filter. The system will retrieve isolates that have both of your specified criteria.</li>
</ul>
</li>
<li>If you prefer to apply a <b>Boolean "AND"</b> to multiple items within the same filter field, you can enter a <b>SOLR query</b>. For example:
<ul>
<li>To retrieve isolates that have <b>both</b> AMR genotypes AND Stress genotypes, open the <a href="/pathogens/isolates#/search/">Isolates Browser</a> and enter a SOLR query such as:
<a href="/pathogens/isolates#/search/property:%22has%20AMR%20genotypes%22%20AND%20property:%22has%20stress%20genotypes%22">property:"has AMR genotypes" AND property:"has stress genotypes"</a>.<br />
<i>(A separate section of this document provides additional information about the <a href="#solr">SOLR query language</a>. Additionally, note that the <a href="#isolates-browser-data-fields">default columns</a> in the <a href="#isolates-browser-output">Isolates Browser output</a> include AMR genotypes but not Stress genotypes; use the <a href="#isolates-browser-display-options">choose columns</a> function in the Isolates Browser to add additional columns to the display.)</i></li>
</ul>
</li>
</ul>
As mentioned under "<a href="#filters-on-the-fly"><b>Filters are generated on the fly</b></a>," the terms that are listed under each filter will depend on the data set you are currently displaying in the browser and on the number and count of values in the filters if multiple filters have selections.<br /><br />
</li>
<!-- ======== END_FILTERS_MENU_OPTIONS ========= -->
<!-- ======== FILTERS_ON_THE_FLY ======= -->
<li id="filters-on-the-fly"><b>Filters are generated on the fly for a given data set</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The choices listed in the "Filters" tab reflect the attributes of the isolates that you are currently viewing in the browser. By default the <b>top 100 terms</b> (based on the number of isolates retrieved by a term, and listed by count of isolates per value) are displayed. The total number of unique values is also shown at the bottom of each filter tab.</li><br /><br />
<li id="filter-search-box"><b>Searching within filters</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
A search box is available in each filter to search for values not found in the top 100. For example, open the "Isolation source" filter and type in the word "chicken" in the search box. All case-insensitive matches to any of the values of the word "chicken" will show up, which is very useful to catch those synonymous values from multiple submitters.<br /><br />
Numeric fields have ranges that can be selected using the check button or reset, while date fields have a range selection as well as quick access to common recent queries.<br /><br />
The search box can be reset with the reset button beside the search box. The entire filter can be removed with the 'X' at the top right corner.<br /><br />
Filters can be collapsed if more than one is shown with the double left hand arrow at the bottom left, and opened again after collapse with the double right hand arrow on collapsed tabs. Each tab is labeled with the filter name.<br /><br />
</li>
<!-- ======== END_FILTERS_ON_THE_FLY ======= -->
<!-- ======== FILTERS_GENE_FIELDS ========== -->
<li id="filters-gene-fields"><b>Gene fields: AMR genotypes, Stress genotypes, Virulence genotypes, AMR genotypes core</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The fields that contain gene and point-mutation data have filters that separate the genes into categories based on characteristics that help to determine how likely the gene/point-mutation is to be properly transcribed and assembled. They are divided into <strong>COMPLETE</strong>, <strong>POINT</strong>, <strong>PARTIAL</strong>, <strong>HMM</strong>, <strong>MISTRANSLATION</strong>, and <strong>PARTIAL_END_OF_CONTIG</strong>. More information on what the categories mean is <a href="/pathogens/docs/data_processing/#genotype-categories">available below</a> and on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#the-method-column">AMRFinderPlus wiki</a>. Each of the categories can be expanded by clicking on the '+' sign next to it, and within that the gene symbols may be selected to further refine your search. As with the other filter fields only the 100 most-frequent gene symbols will appear in the filter box. To search for specific genes you can use the search function within the filter. <br /><br />
</li>
<!-- ======== END_FILTERS_GENE_FIELDS ========= -->
<!-- ======== FILTERS_SCIENTIFIC_NAME ========= -->
<li id="filters-scientific-name"><b>Scientific name</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The <b>Scientific name</b> field is set up with a hierarchy that represents lineages based on <a href="/taxonomy">NCBI Taxonomy</a> to allow you to filter for all members of a given taxonomic group. Clicking on a node at a higher level will select all the taxa within that group even though the boxes by those names won't show up as selected. As with other filters only the 100 most common values are shown, in this case that is the 100 most common values in the Scientific name field and the higher level taxa that they belong to. You can search within the values using the Search box within the filter to narrow the choices and reveal scientific names that are not in the most frequent set.
<img src="/core/assets/pathogens/images/Isolates-Browser-Taxonomy-filter.png" /> For example selecting <strong><em>Enterobacteriaceae</em></strong> will include all isolates that are <em><strong>Salmonella</strong></em>, <em><strong>E. coli</strong></em>, <em><strong>Shigella</strong></em>, and <em><strong>Klebsiella</strong></em> even though those more specific taxa are not selected individually. <br /><br />
</li>
<!-- ======== END_FILTERS_SCIENTIFIC_NAME ========= -->
<!-- ======== FILTERS_DATE_FIELDS ========== -->
<li id="filters-date-fields"><b>Date fields: Create date, Collection date</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Filters for fields with date strings in them have date ranges that are searched inclusively, so if the collection date filter's From: value was 1/1/2021 and its To: value was 12/31/2021 then there would be 365 days included in the search (both 1/1/2021 and 12/31/2021 would be included).
The date fields also have buttons to conveniently search for recent dates. For example, if you press the <b>Last 1 day</b> button in the <b>Create date</b> filter you would get any isolates whose <b>Create date</b> value was the current day.
</li>
<!-- ======== END_FILTERS_DATE_FIELDS ========== -->
<!-- ======== FILTERS_ISOLATE ======= -->
<li id="filters-isolate"><b>Isolate</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The isolate field search in the filter is case sensitive so accessions such as PDT000000002.3 need to have the "PDT" portion in capital letters.
</li><br />
<!-- ======== END_FILTERS_ISOLATE ======= -->
<!-- ======== FILTERS_ACCESSION_SNP_CLUSTER ======= -->
<li id="filters-snp-cluster"><b>SNP cluster</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The SNP cluster filter search is case sensitive so accessions such as PDS000174935.6 need to have the "PDS" portion in capital letters.
</li>
<!-- ======== END_FILTERS_SNP_CLUSTER ======= -->
<!-- ======== FILTERS_LOOK_FOR_SYNONYMS ======= -->
<li id="filters-synonyms"><b>Look for synonyms</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
A number of <a href="#isolates-browser-data-fields">data fields</a> <b>do not use a controlled vocabulary</b>, but instead list the various terms that submitters applied to their data. As a result, submitters might use different terms for the same concept. Therefore, if you are using filters, <b>look for synonymous terms</b> that are listed under a given filter and check the boxes for any/all terms that are of interest. If you are searching the data fields directly (as described in the <a href="#isolates-browser-advanced-search">advanced search</a> section of this document), consider including synonyms in your query in order to broaden retrieval.<br />
Synonyms are also useful to include if you are doing <a href="#isolates-browser-advanced-search">advanced searches</a>, such as limiting your search to specific <a href="#isolates-browser-data-fields">data fields</a>. As an example, see the sample searches of the <a href="#isolates-browser-data-field-Host">host</a> organism data field.
</li><br />
<!-- ======== END_FILTERS_LOOK_FOR_SYNONYMS ======= -->
</ul>
</div>
<!-- =========== END_ISOLATES_BROWSER_FILTERS ========== -->
<!-- =========== ISOLATES_BROWSER_ADVANCED_SEARCH ========== -->
<h4 id="isolates-browser-advanced-search">Advanced Search <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<!-- =========== SOLR_QUERY_LANGUAGE ========== -->
<div style="padding-left: 2em">
<h4 id="solr"><b>SOLR Query Language</b></h4>
The <a href="/pathogens/isolates#/search/">Isolates Browser</a> uses a modified SOLR search platform (version 6.6) to retrieve pathogen data. The <a href="https://lucene.apache.org/solr/guide/">Apache SOLR Reference Guides</a> provide detailed documentation for the platform. Some key concepts are introduced below, and link to the complete documentation in the <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a>, particularly the sections on: <a href="https://lucene.apache.org/solr/guide/6_6/searching.html">Searching</a> &gt; <a href="https://lucene.apache.org/solr/guide/6_6/query-syntax-and-parsing.html">Query Syntax and Parsing</a> &gt; <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html"><b>The Standard Query Parser</b></a>.<br /><br />
In some instances, there might be some slight differences between the Isolates Browser and the SOLR Standard Query Parser. For example, the Isolates Browser has been modified relative to the SOLR Standard Query Parser in the way it handles <a href="#special-characters">special characters</a> that are part of a search term. Specifically, the browser has been programmed to automatically escape special characters (such as <b>hyphens</b> in <a href="#isolates-browser-data-field-Strain">strain</a> names, <b>parentheses</b> in <a href="#isolates-browser-data-field-AMRGenotypes">gene names</a>, slashes in <a href="#isolates-browser-data-field-Serovar">serovar</a> names, etc.) and to treat them as part of the search term. The Browser therefore retrieves isolates that include the term exactly as it was entered, including special characters.<br /><br />
<a href="#solr-query-terms"><b>Query terms</b></a> | <a href="#solr-single-term">single term</a> | <a href="#solr-multiple-terms">multiple terms</a> | <a href="#solr-phrase">phrase</a> | <a href="#solr-term-modifiers">term modifiers</a> | <a href="#wildcards">wildcard searches</a> | <a href="#special-characters">special characters in search terms</a><br />
<a href="#operators"><b>Operators</b></a> | <a href="#operators-boolean">AND, OR, NOT</a> | <a href="#operators-plus-and-minus">plus (+) and minus (-) symbols</a> | <a href="#range-searches">range searches [nnnn TO nnnn]</a><br />
<a href="#parentheses"><b>Parentheses</b></a> | <a href="#parentheses-boolean">use to order Boolean queries</a> | <a href="#parentheses-list-of-terms">use to input a list of query terms</a> | <a href="#parentheses-in-gene-name">automatically escaped if part of a gene name or query term</a><br />
<a href="#isolates-browser-data-fields"><b>Data Fields</b></a><br />
<a href="#isolates-browser-search-modifiers"><b>Search modifiers</b></a><br />
<a href="#solr-sample-searches"><b>Examples of SOLR queries</b></a>
</div>
<!-- =========== SOLR_QUERY_LANGUAGE ========== -->
<!-- =========== SOLR_QUERY_TERMS ========== -->
<div style="padding-left: 2em">
<h4 id="solr-query-terms">SOLR Query terms <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em"><a href="#solr-single-term">single term</a> | <a href="#solr-multiple-terms">multiple terms</a> | <a href="#solr-phrase">phrase</a> | <a href="#solr-term-modifiers">term modifiers</a> | <a href="#wildcards">wildcard searches</a> | <a href="#special-characters">special characters in search terms</a></div>
<ul>
<!-- =========== SOLR_QUERY_TERMS_SINGLE ========== -->
<li id="solr-single-term"><span style="background-color: #ffff00"><b>Single term</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
A single query term, such as <b>lettuce</b>, will retrieve all isolates that have the term in any <a href="#isolates-browser-data-fields">data field</a>.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/lettuce"><i>lettuce</i></a><br />
will show isolates that contain the term <i>lettuce</i> in any <a href="#isolates-browser-data-fields">data field</a>.<br /><br />
<b>Tips:</b><br /><br />
If you search a specific <a href="#isolates-browser-data-fields">data field</a>, your search will become <a href="#case-sensitive">case sensitive</a>.<br /><br />
For example, compare the search results for:<br />
<a href="/pathogens/isolates#/search/isolation_source:lettuce"><i>isolation_source:lettuce</i></a><br />
versus:<br />
<a href="/pathogens/isolates#/search/isolation_source:Lettuce"><i>isolation_source:Lettuce</i></a><br />
For broader retrieval, you can either remove the data field specifier to conduct a <a href="#case-insensitive">case insensitive search</a>, or include synonyms in your query, for example:<br />
<a href="/pathogens/isolates#/search/isolation_source:lettuce%20OR%20isolation_source:Lettuce"><i>isolation_source:lettuce OR isolation_source:Lettuce</i></a><br />
A separate section of this document provides additional information about searching for <a href="#synonyms">synonyms</a>.<br />
</li>
<!-- =========== SOLR_QUERY_TERMS_MULTIPLE_TERMS ========== -->
<li id="solr-multiple-terms">
<span style="background-color: #ffff00"><b>Multiple terms</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
If you include two or more terms in your query, the system will <b>automatically insert a Boolean OR in each space</b> that it encounters. As a result, it will search for each word individually, and the system will show isolates that contain at least one of your search terms in any <a href="#isolates-browser-data-fields">data field</a>.<br /><br />
<b>Examples:</b><br /><br />
A search for the following query (with no quotes or <a href="#special-characters">special characters</a>):<br />
<a href="/pathogens/isolates#/search/romaine%20lettuce"><i>romaine lettuce</i></a><br />
will be <b>interpreted as</b>:<br />
<b><i>romaine OR lettuce</i></b><br /><br />
A search for the following query (with no quotes or <a href="#special-characters">special characters</a>):<br />
<a href="/pathogens/isolates#/search/all%20purpose%20flour"><i>all purpose flour</i></a><br />
will be <b>interpreted as</b>:<br />
<b><i>all OR purpose OR flour</i></b><br />
because the system will insert an OR when it encounters each space in the query string.<br /><br />
A search for the following query (with no quotes and with a hyphen in <i>all-purpose</i>):<br />
<a href="/pathogens/isolates#/search/all-purpose%20flour"><i>all-purpose flour</i></a><br />
will be <b>interpreted as</b>:<br />
<b><i>all-purpose OR flour</i></b><br />
because the system will treat the <a href="#special-characters">special character</a> (hyphen) as part of the first query term, and it will insert an OR where it encounters a space in the query string.<br /><br />
<b>Tips:</b><br /><br />
If you include a <a href="#isolates-browser-data-fields">data field</a> specifier and you do not enclose your query terms in quotes, the data field specifier will be applied only to the term that immediately follows it, and that term will be searched in a <a href="#case-sensitive">case sensitive</a> manner.<br /><br />
For example, a search for the following query (with no quotes or special characters):<br />
<a href="/pathogens/isolates#/search/isolation_source:romaine%20lettuce"><i>isolation_source:romaine lettuce</i></a><br />
will be <b>interpreted as</b>:<br />
<b><i>isolation_source:romaine OR lettuce</i></b><br />
The system will show all isolates that have the lower case term <i>romaine</i> in the <a href="#isolates-browser-data-field-IsolationSource">Isolation Source</a> data field, and the term <i>lettuce</i> in any case and in any field.<br />
If, on the other hand, you want to search <i><b>romaine lettuce</b></i> as a <a href="#solr-phrase"><b>phrase</b></a>, you will need to use <b>quotes</b>, as described below.
</li>
<!-- =========== SOLR_QUERY_TERMS_PHRASE ========== -->
<li id="solr-phrase">
<span style="background-color: #ffff00"><b>Phrase</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
If you want to search for a <b>phrase</b>, surround your query terms with <b>quotes</b>.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/%22romaine%20lettuce%22"><i>"romaine lettuce"</i></a><br />
will show isolates that contain that phrase in any <a href="#isolates-browser-data-fields">data field</a>.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/%22all-purpose%20flour%22"><i>"all-purpose flour"</i></a><br />
will show isolates that contain the phrase <i>all-purpose flour</i>, and will conduct the search in a <a href="#case-insensitive">case insensitive</a> manner because the query does not include a <a href="#isolates-browser-data-fields">data field</a> specifier.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/isolation_source:%22All-Purpose%20Flour%22"><i>isolation_source:"All-Purpose Flour"</i></a><br />
will show isolates that contain the phrase <i>All-Purpose Flour</i> in the <a href="#isolates-browser-data-field-IsolationSource">Isolation Source</a> data field.<br />
Because the query includes a <a href="#isolates-browser-data-fields">data field</a> specifier, the search is conducted in a <a href="#case-sensitive">case sensitive</a> manner. It will therefore only show isolates that have the exact phrase you specified, including upper and lower case letters as well as the hyphen.<br /><br />
<b>Tips:</b><br /><br />
If <b>no quotes</b> are used, the system will automatically insert a Boolean OR when it encounters a space in the query string. If you query specific <a href="#isolates-browser-data-fields">data fields</a>, please note that the names of data fields, and the values they contain, are <a href="#case-sensitive">case sensitive</a>. <a href="#special-characters">Special characters</a>, such as the hyphen in the examples above, are recognized as part of the search term and therefore retained in the query, regardless of whether quotes are used.<br /><br />
For example, if the last sample search above was entered as
<a href="/pathogens/isolates#/search/isolation_source:All-Purpose%20Flour"><i>isolation_source:All-Purpose Flour</i></a>, with <b>no quotes</b>, it would be interpreted as <i>isolation_source:All-Purpose OR flour</i>. The Browser would show isolates that contain the term <i>All-Purpose</i> in the <a href="#isolates-browser-data-field-IsolationSource">Isolation Source</a> data field or the term <i>flour</i> in any data field. This is because the system processes the term adjacent to the data field specifier in a <a href="#case-sensitive">case sensitive</a> manner, and inserts a Boolean OR when it encounters a space.
<!-- B>Proximity searches:</b><br /><br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> also provides information about <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-ProximitySearches">proximity searches</a>, which are included in the Standard Query Parser, if you would like to retrieve records that have your search terms within a specified distance of each other. -->
</li>
<!-- =========== SOLR_QUERY_TERMS_TERM_MODIFIERS ========== -->
<li id="solr-term-modifiers">
<span style="background-color: #ffff00"><b>Term modifiers</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
As noted in the "<a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html">Standard Query Parser</a>" section of the <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a>, "Solr supports a variety of <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-TermModifiers">term modifiers</a> that add flexibility or precision, as needed, to searches. These modifiers include <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-WildcardSearches">wildcard characters</a>, characters for making a search "<a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-FuzzySearches">fuzzy</a>" or more general, and so on."
</li>
<!-- =========== SOLR_QUERY_TERMS_WILDCARDS ========== -->
<li id="wildcards">
<span style="background-color: #ffff00"><b>Wildcard searches</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
A question mark (?) can be included in your query string to match any single character.<br />
An asterisk (*) can be included in your query string to match zero or more sequential characters.
<!-- Bill's edits for this section include the comment:
Need to add combined wild-card searches per discussion on
https://jira.ncbi.nlm.nih.gov/browse/SEQUI-1080 --><br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/AMR_genotypes:tet(*)"><i>AMR_genotypes:tet(*)</i></a><br />
will show isolates that have a string of "<i>tet(*)</i>" in the <a href="#isolates-browser-data-field-AMRGenotypes">AMR Genotypes</a> data field, with the asterisk serving as a wildcard to retrieve gene names that have any characters in the parentheses, such as <i>tet(A), tet(M), tet(O), tet(X), etc.</i><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/strawberr*"><i>strawberr*</i></a><br />
will show isolates that contain terms such as <i>strawberry</i>, <i>strawberries</i>, etc. in any <a href="#isolates-browser-data-fields">data field</a>.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/isolation_source:*berry"><i>isolation_source:*berry</i></a><br />
will show isolates that contain terms such as <i>strawberry</i>, <i>mulberry</i>, etc. in the <a href="#isolates-browser-data-field-IsolationSource">Isolation Source</a> data field.<br /><br />
<b>Tips:</b><br /><br />
The wildcard characters can appear anywhere in your search term (at the beginning, middle, or end).<br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> provides additional details about the use of <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-WildcardSearches">wildcards</a>.<br /><br />
</li>
<!-- =========== SOLR_QUERY_TERMS_SPECIAL_CHARACTERS ========== -->
<li id="special-characters">
<span style="background-color: #ffff00"><b>Special characters in search terms</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
As noted in the introduction to the <a href="#isolates-browser-advanced-search">advanced search</a> section of this document, the <a href="/pathogens/isolates#/search/">Isolates Browser</a> uses the SOLR search platform (version 6.6) to retrieve pathogen data. However, in some instances, there might be some slight differences between the Isolates Browser and the SOLR Standard Query Parser.<br /><br />
For example, the Isolates Browser has been modified relative to the SOLR Standard Query Parser in the way it handles <b>special characters that are part of a search term</b>. Specifically, the browser has been programmed to <b>automatically escape</b> special characters (such as <b>hyphens</b> in <a href="#isolates-browser-data-field-Strain">strain</a> names, <b>parentheses</b> in <a href="#isolates-browser-data-field-AMRGenotypes">gene names</a>, <b>slashes</b> in <a href="#isolates-browser-data-field-Serovar">serovar</a> names, etc.) and to treat them as part of the search term. As a result, the Browser retrieves isolates that include the term exactly as it was entered, including special characters.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/strain:KCRI-598A"><i>strain:KCRI-598A</i></a><br />
will show isolates that contain the term <i>KCRI-598A</i> in the <a href="#isolates-browser-data-field-Strain">Strain</a> data field.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/serovar:1~2F2a"><i>serovar:1/2a</i></a><br />
will show isolates that contain the term <i>1/2a</i> in the <a href="#isolates-browser-data-field-Serovar">Serovar</a> data field.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/AMR_genotypes:ant(6)-Ia%20AND%20AMR_genotypes:aph(3')-IIIa"><i>AMR_genotypes:ant(6)-Ia AND AMR_genotypes:aph(3')-IIIa</i></a><br />
will show isolates that have both <i>ant(6)-Ia</i> and <i>aph(3')-IIIa</i> in the <a href="#isolates-browser-data-field-AMRGenotypes">AMR Genotypes</a> data field.<br /><br />
<b>Tips:</b><br /><br />
When you query specific <a href="#isolates-browser-data-fields">data fields</a>, please note that the names of data fields, and the values they contain, are <a href="#case-sensitive">case sensitive</a>. Also, if your query string includes a space, surround the query string with quotes in order to do a <a href="#solr-phrase">phrase search</a>. If no quotes are used, the system will automatically insert a Boolean OR when it encounters a space in the query string.
</li>
</ul>
</div>
<!-- =========== END_SOLR_QUERY_TERMS ========== -->
<!-- =========== SOLR_OPERATORS ========== -->
<div style="padding-left: 2em">
<h4 id="operators">SOLR Operators <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em"><a href="#operators-boolean">AND, OR, NOT</a> | <a href="#operators-plus-and-minus">Plus (+) and Minus (-) symbols</a> | <a href="#range-searches">Range searches [nnnn TO nnnn]</a></div>
<ul>
<!-- =========== SOLR_OPERATORS_BOOLEAN ========== -->
<li id="operators-boolean">
<span style="background-color: #ffff00"><b>AND, OR, NOT</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
The SOLR search platform allows you to apply Boolean logic to queries with the AND, OR, and NOT operators. Boolean operators must be written in <b>upper case letters</b>, or they can be represented as <b>symbols</b>:<br /><br />
<b>AND</b> can be represented as <b>&amp;&amp;</b><br />
<b>OR</b> can be represented as <b>||</b><br />
<b>NOT</b> can be represented as <b>!</b><br /><br />
By <b>default</b>, the system applies the <b>OR</b> operator each time it encounters a space in the query string.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/all-purpose%20flour"><i>all-purpose flour</i></a><br />
will be interpreted as:<br />
<i>all-purpose OR flour</i><br />
because the system applies a Boolean OR when it encounters a space in your query string.<br />
The system recognizes <a href="#special-characters">special characters</a> such as the hyphen when they are part of a search term, and therefore will show isolates that contain the term <i>all-purpose</i> in any data field, or the term <i>flour</i> in any data field.
<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/romaine%20lettuce"><i>romaine lettuce</i></a><br />
will be interpreted as:<br />
<i>romaine OR lettuce</i><br />
and will show isolates that contain the term <i>romaine</i> in any data field, or the term <i>lettuce</i> in any data field.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/romaine%20AND%20lettuce"><i>romaine AND lettuce</i></a><br />
will show isolates that contain both of the terms, which can appear independently of each other in any <a href="#isolates-browser-data-fields">data field</a>. If you instead prefer to retrieve isolates in which two or more query terms appear adjacent to each other, use quotes to conduct a <a href="#solr-phrase">phrase search</a>. For example, a search for: <a href="/pathogens/isolates#/search/%22romaine%20lettuce%22"><i>"romaine lettuce"</i></a> will retrieve isolates that contain the phrase <i>romaine lettuce</i> in any data field.<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/lettuce%20NOT%20romaine"><i>lettuce NOT romaine</i></a><br />
will show isolates that contain the term <i>lettuce</i>, but not the term <i>romaine</i>.<br />
That same search can also be written as:<br />
<a href="/pathogens/isolates#/search/lettuce%20!romaine"><i>lettuce !romaine</i></a><br />
or as:<br />
<a href="/pathogens/isolates#/search/lettuce%20-romaine"><i>lettuce -romaine</i></a>
<br /><br />
<b>Tips:</b><br /><br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> provides additional details about the use of <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-BooleanOperatorsSupportedbytheStandardQueryParser">Boolean operators</a>.
</li>
<!-- =========== SOLR_OPERATORS_PLUS_MINUS ========== -->
<li id="operators-plus-and-minus">
<span style="background-color: #ffff00"><b>Plus (+) and Minus (-) symbols</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
The plus (+) and minus (-) symbols can be used to require that a term be present or absent, respectively, in the records retrieved by a search.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/lettuce%20%2Bromaine"><i>lettuce +romaine</i></a><br />
will show isolates that contain the term <i>lettuce</i> (in any data field) and that <b>must contain</b> the term <i>romaine</i> (in any data field).<br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/lettuce%20-romaine"><i>lettuce -romaine</i></a><br />
will show isolates that contain the term <i>lettuce</i> (in any data field) but <b>must not contain</b> the term <i>romaine</i> (in any data field).<br /><br />
<b>Tips:</b><br /><br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> provides additional details about the use of the plus (+) and minus (-) symbols in the section on <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-BooleanOperatorsSupportedbytheStandardQueryParser">Boolean operators</a>.
</li>
<!-- =========== SOLR_OPERATORS_RANGE_SEARCH ======== -->
<li id="range-searches">
<span style="background-color: #ffff00"><b>Range searches [nnnn TO nnnn]</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
To search for a range of values, enter a query such as:<br />
<i>collection_date:[value1 TO value2]</i><br />
with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>.<br /><br />
<b>Examples:</b><br /><br />
<b>Range of Collection Dates:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/collection_date:%5B2013-02*%20TO%202013-08*%5D"><i>collection_date:[2013-02* TO 2013-08*]</i></a><br />
will show isolates that were collected anytime from <i>February 2013</i> through <i>August 2013</i>.<br />
A search for:<br />
<a href="/pathogens/isolates#/search/collection_date:%5B2013*%20TO%202015*%5D"><i>collection_date:[2013* TO 2015*]</i></a><br />
will show isolates that were collected in any month or date from <i>2013</i> through <i>2015</i>.<br /><br />
See the section of this help document for more information about the <a href="#isolates-browser-data-field-CollectionDate">Collection Date</a> data field, which accepts an asterisk (*) as a wildcard.<br /><br />
<b>Range of Create Dates:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/creation_date:%5B2013-02%20TO%202013-08%5D"><i>creation_date:[2013-02 TO 2013-08]</i></a><br />
will show isolates that were first seen by the Pathogen Detection system anytime from <i>February 2013</i> through <i>August 2013</i>.<br />
See the section of this help document for more information about the <a href="#isolates-browser-data-field-CreateDate">Create Date</a> data field, which does NOT accept an asterisk (*) as a wildcard.<br /><br />
<b>Tips:</b><br /><br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> provides additional details about <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-RangeSearches">Range searches</a>.
</li>
</ul>
</div>
<!-- =========== END_SOLR_OPERATORS ========== -->
<!-- =========== SOLR_PARENTHESES ========== -->
<div style="padding-left: 2em">
<h4 id="parentheses">Parentheses <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em"><a href="#parentheses-boolean">order Boolean queries</a> | <a href="#parentheses-list-of-terms">input a list of query terms</a> | <a href="#parentheses-in-gene-name">automatically escaped if part of a query term</a></div>
<ul>
<!-- =========== SOLR_PARENTHESES_ORDER ========== -->
<li id="parentheses-boolean">
<span style="background-color: #ffff00"><b>Use parentheses to determine order of execution in Boolean queries</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
By default, the system applies Boolean operators from left to right in the query. Parentheses can be used to alter the order of execution of Boolean operators. Sub-queries that are surrounded by parentheses will be executed first.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/AMR_genotypes:qnr*%20AND%20(AST_phenotypes:ciprofloxacin=R%20OR%20AST_phenotypes:%22nalidixic%20acid=R%22)"><b><i>AMR_genotypes:qnr* AND (AST_phenotypes:ciprofloxacin=R OR AST_phenotypes:"nalidixic acid=R")</i></b></a><br />
will show all of the isolates that have a qnr gene and that are resistant to either ciprofloxacin or nalidixic acid.<br />
(For additional information about this example, see the section of this help document on <a href="#solr-sample-searches">Examples of SOLR Queries</a> &gt; <a href="#solr-sample-search-GenotypesQnrCiproResistant">Genotypes and phenotypes: has specific gene, resistant to antibiotics</a>.)<br /><br />
<b>Tips:</b><br /><br />
The <a href="https://lucene.apache.org/solr/guide/6_6/">SOLR Reference Guide 6.6</a> provides additional details about use of parentheses for <a href="https://lucene.apache.org/solr/guide/6_6/the-standard-query-parser.html#TheStandardQueryParser-GroupingTermstoFormSub-Queries">grouping terms to form sub-queries</a>.
</li>
<!-- =========== SOLR_PARENTHESES_LIST ========== -->
<li id="parentheses-list-of-terms">
<span style="background-color: #ffff00"><b>Use parentheses to input a list of query terms</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
Search terms that are enclosed in parentheses will be OR'ed together.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/escherichia%20AND%20(FDA%20CDC%20USDA)"><i>escherichia AND (FDA CDC USDA)</i></a><br />
will show isolates that contain the term <i>escherichia</i> (in any <a href="#isolates-browser-data-fields">data field</a>), and the term <i>FDA</i> or <i>CDC</i> or <i>USDA</i> (in any data field).<br /><br />
</li>
<!-- =========== SOLR_PARENTHESES_IN_QUERY_TERM ======= -->
<li id="parentheses-in-gene-name">
<span style="background-color: #ffff00"><b>Parentheses are automatically escaped if they are an internal part of a gene name or query term</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<br /><br />
As noted in the introduction to the <a href="#isolates-browser-advanced-search">advanced search</a> section of this document, the <a href="/pathogens/isolates#/search/">Isolates Browser</a> uses the SOLR search platform (version 6.6) to retrieve pathogen data. However, in some instances, there might be some slight differences between the Isolates Browser and the SOLR Standard Query Parser.<br /><br />
For example, the Isolates Browser has been modified relative to the SOLR Standard Query Parser in the way it handles <a href="#special-characters"><b>special characters</b></a> that are part of a search term. Specifically, the browser has been programmed to <b>automatically escape</b> special characters, such as <b>parentheses</b> that are part of <a href="#isolates-browser-data-field-AMRGenotypes">gene names</a>, and to treat them as part of the search term. As a result, the Browser retrieves isolates that include the term exactly as it was entered, including special characters.<br /><br />
<b>Examples:</b><br /><br />
A search for:<br />
<a href="/pathogens/isolates#/search/AMR_genotypes:ant(6)-Ia%20AND%20AMR_genotypes:aph(3')-IIIa"><i>AMR_genotypes:ant(6)-Ia AND AMR_genotypes:aph(3')-IIIa</i></a><br />
will show isolates that have both strings, <i>ant(6)-Ia</i> and <i>aph(3')-IIIa</i>, in the <a href="#isolates-browser-data-field-AMRGenotypes">AMR Genotypes</a> data field.
</li>
</ul>
</div>
<!-- =========== END_SOLR_PARENTHESES ========== -->
<!-- ========= DATA_FIELDS ========== -->
<!-- ========= DATA_FIELDS_INTRO =========== -->
<h3 id="isolates-browser-data-fields">Data fields in the Pathogens Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The Isolates Browser <a href="#isolates-browser-data-fields-list">data fields listed below</a> have been indexed by the Pathogen Detection project and are therefore <b>directly searchable</b>.<br /><br />
Each data field reflects an available column in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> web interface. The <a href="#isolates-browser-output">output</a> section of this document provides tips on how to <a href="#isolates-browser-display-options">choose columns</a> to include in the display.<br /><br />
<b>Please note:</b> in the list of available data fields below: <br />
<ul>
<li>The term shown in the <span style="background-color: #ffff00">regular font</span> is the <span style="background-color: #ffff00">display name</span> (column header) shown by the Isolates Browser web interface. The term shown in <span style="background-color: #ffff00"><i>(italics)</i></span> is the <span style="background-color: #ffff00"><b><i>name of the corresponding data field</i></b>, if you want to search that field directly</span>.</li>
<li>For example, one data field is listed as: <a href="#isolates-browser-data-field-Location">Location (<b><i>geo_loc_name</i></b>)</a>. The term "<b>Location</b>" appears in the Isolates Browser column header, and "<b><i>geo_loc_name</i></b>" is the string you should use if you want to search that data field directly.</li>
<li>Brief <b><i>italicized search examples</i></b> are also provided for each data field, when possible, showing how to query the data field directly. The values represent text strings <b>exactly as they appear in the data fields</b>, including upper case and lower case letters, <a href="#special-characters">special characters</a> such as hyphens, etc. The <span style="background-color: #ffff00">data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a></span>, as noted below.</li>
</ul>
<span style="background-color: #ffff00" id="data-fields-case-sensitive"><b>Case sensitive searches:</b></span> The <b>names of the data fields</b>, and the <b>values they contain</b>, are <b>case sensitive</b>. The values represent text strings <b>exactly as they were entered by the submitter</b>, including upper case and lower case letters, special characters such as hyphens, etc. (A separate section of this document provides <a href="#case-sensitive">examples of case sensitive searches</a>.)<br /><br />
The case-sensitivity and the retention of special characters such as hyphens and parentheses (when they are internal to a search term) were built into the system in order to ensure <b>precise handling of searches</b> for values such as <b>strain name</b>, <b>serovar</b>, <b>gene symbol</b>, and more. The case sensitivity and handling of special characters applies to other data fields as well.<br /><br />
Therefore, when you search a specific data field, the system will retrieve isolates that contain the <b>exact string you have specified</b>, including upper case and lower case letters, as well as <a href="#query-tips-special-characters">special characters</a> such as hyphens and parentheses.<br /><br />
<span style="background-color: #ffff00" id="data-fields-case-insensitive"><b>Case insensitive searches:</b></span> <b>If you are uncertain about the exact text string</b> that appears in isolate records, then you can simply enter the query in any text format (all upper, all lower, or mixed case) <b>without a data field specifier</b>. The system will then search the <b>Text index</b>, which is a <b>case insensitive compilation of terms</b> from many text-containing data fields. This provides a flexible search mechanism, although it is less precise in its retrieval as the query terms can appear in any text field of the pathogen isolate records. (A separate section of this document provides <a href="#case-insensitive">examples of case insensitive searches</a>.)<br /><br />
The <a href="#isolates-browser-query-tips">query tips</a> section of this document includes a <span style="background-color: #ffff00"><a href="#case-sensitive">comparison of case sensitive versus case insensitive searches</a></span>.<br /><br />
<span id="isolates-browser-data-fields-list"><b>The available data fields in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> include the following:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
Note that fields shown in the default display are highlighted in blue. Each field is written in this format: &#160;&#160;<b>Display name</b> (<b><i>data_field_name</i></b>)<br />
The "Display name" is the column header that appears in the Isolates Browser web interface, and the "<i>data_field_name</i>" is the <a href="#case-sensitive">case-sensitive</a> string you should enter if you want to search the data field directly using a <a href="#solr">SOLR query</a>:<br />
<br />
Fields marked with + are also fields that can be used as labels in the <b>SNP Tree Viewer</b>.
<br /><br />
<!-- ========== DATA_FIELDS_MINI_TOC =========== -->
<table width="100%">
<tr>
<td width="50%" valign="top">
<a href="#isolates-browser-data-field-AMRGenotypes"><span style="background-color: #cde1ff">AMR genotypes (<b><i>AMR_genotypes</i></b>)</span></a><br />
<a href="#isolates-browser-data-field-AMRGenotypesCore">AMR genotypes core (<b><i>AMR_genotypes_core</i></b>)</a><br />
<a href="#isolates-browser-data-field-amrfinderplus-analysis-type">AMRFinderPlus analysis type (<b><i>amrfinderplus_analysis_type</i></b>)</a><br />
<a href="#isolates-browser-data-field-amrfinderplus-version">AMRFinderPlus version (<b><i>amrfinderplus_version</i></b>)</a><br />
<a href="#isolates-browser-data-field-Assembly"><span style="background-color: #cde1ff">Assembly (<b><i>asm_acc</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-ASTPhenotypes">AST phenotypes (<b><i>AST_phenotypes</i></b>)</a><br />
<a href="#isolates-browser-data-field-BioProject">BioProject (<b><i>bioproject_acc</i></b>)+</a><br />
<a href="#isolates-browser-data-field-BioSample"><span style="background-color: #cde1ff">BioSample (<b><i>biosample_acc</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-CollectedBy">Collected by (<b><i>collected_by</i></b>)+</a><br />
<a href="#isolates-browser-data-field-CollectionDate">Collection Date (<b><i>collection_date</i></b>)+</a><br />
<a href="#isolates-browser-data-field-ComputedTypes"><span style="background-color: #cde1ff">Computed types (<b><i>computed_types</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-Contigs">Contigs (<b><i>asm_stats_n_contig</i></b>)+</a><br />
<a href="#isolates-browser-data-field-CreateDate"><span style="background-color: #cde1ff">Create Date (<b><i>creation_date</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-FoodOrigin"><span style="background-color: #cde1ff">Food origin (<b><i>food_origin</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-Host">Host (<b><i>host</i></b>)+</a><br />
<a href="#isolates-browser-data-field-HostDisease">Host Disease (<b><i>host_disease</i></b>)+</a><br />
<a href="#isolates-browser-data-field-IFSAC_category">IFSAC_category (<b><i>IFSAC_category</i></b>)</a><br />
<a href="#isolates-browser-data-field-Isolate"><span style="background-color: #cde1ff">Isolate (<b><i>target_acc</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-Isolate_identifiers"><span style="background-color: #cde1ff">Isolate_identifiers (<b><i>isolate_identifiers</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-IsolationSource"><span style="background-color: #cde1ff">Isolation Source (<b><i>isolation_source</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-IsolationType"><span style="background-color: #cde1ff">Isolation type (<b><i>epi_type</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-KmerGroup">K-mer group (<b><i>kmer_group</i></b>)+</a><br />
<a href="#isolates-browser-data-field-LatLon">Lat/Lon (<b><i>lat_lon</i></b>)+</a><br />
<a href="#isolates-browser-data-field-Length">Length (<b><i>asm_stats_length_bp</i></b>)+</a><br />
<a href="#isolates-browser-data-field-Level">Level (<b><i>asm_level</i></b>)+</a><br />
<a href="#isolates-browser-data-field-LibraryLayout">Library Layout (<b><i>LibraryLayout</i></b>)+</a><br />
<a href="#isolates-browser-data-field-Location"><span style="background-color: #cde1ff">Location (<b><i>geo_loc_name</i></b>)+</span></a><br />
</td>
<td width="50%" valign="top">
<a href="#isolates-browser-data-field-Method">Method (<b><i>assembly_method</i></b>)+</a><br />
<a href="#isolates-browser-data-field-MinSame"><span style="background-color: #cde1ff">Min-same (<b><i>minsame</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-MinDiff"><span style="background-color: #cde1ff">Min-diff (<b><i>mindiff</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-N50">N50 (<b><i>asm_stats_contig_n50</i></b>)+</a><br />
<a href="#isolates-browser-data-field-OrganismGroup"><span style="background-color: #cde1ff">Organism Group (<b><i>taxgroup_name</i></b>)</span></a><br />
<a href="#isolates-browser-data-field-Outbreak">Outbreak (<b><i>outbreak</i></b>)+</a><br />
<!-- a href="#DataFieldParentGroup">Parent group (<b><i>parent_group</i></b>)</a><br -->
<a href="#isolates-browser-data-field-PFGEPrimaryEnzymePattern">PFGE Primary Enzyme Pattern (<b><i>PFGE_PrimaryEnzyme_pattern</i></b>)+</a><br />
<a href="#isolates-browser-data-field-PFGESecondaryEnzymePattern">PFGE Secondary Enzyme Pattern (<b><i>PFGE_SecondaryEnzyme_pattern</i></b>)+</a><br />
<a href="#isolates-browser-data-field-Platform">Platform (<b><i>Platform</i></b>)+</a><br />
<a href="#isolates-browser-data-field-refgene-db-version">PD Ref Gene Catalog version (<b><i>refgene_db_version</i></b>)</a><br />
<a href="#isolates-browser-data-field-Run">Run (<b><i>Run</i></b>)+</a><br />
<a href="#isolates-browser-data-field-Strain"><span style="background-color: #cde1ff">Strain (<b><i>strain</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-Serovar"><span style="background-color: #cde1ff">Serovar (<b><i>serovar</i></b>)+</span></a><br />
<!-- a href="#DataFieldSerotype">Serotype (<b><i>serotype</i></b>)</a><br -->
<a href="#isolates-browser-data-field-SNPCluster"><span style="background-color: #cde1ff">SNP cluster (<b><i>erd_group</i></b>)+</span></a><br />
<a href="#isolates-browser-data-field-ScientificName">Scientific name (<b><i>scientific_name</i></b>)+</a><br />
<a href="#isolates-browser-data-field-source_type">Source type (<b><i>source_type</i></b>)+</a><br />
<a href="#isolates-browser-data-field-SpeciesTaxID">Species TaxID (<b><i>species_taxid</i></b>)+</a><br />
<a href="#isolates-browser-data-field-SRACenter">SRA Center (<b><i>sra_center</i></b>)+</a><br />
<a href="#isolates-browser-data-field-SRAReleaseDate">SRA Release Date (<b><i>sra_release_date</i></b>)+</a><br />
<!-- a href="#DataFieldStatus">Status (<b><i>status</i></b>)</a><br -->
<a href="#isolates-browser-data-field-stress-genotypes">Stress genotypes (<b><i>stress_genotypes</i></b>)</a><br />
<a href="#isolates-browser-data-field-TaxID">TaxID (<b><i>taxid</i></b>)+</a><br />
<!-- a href="#tree_node_ids">tree_node_ids (<b><i>tree_node_ids</i></b>)</a><br -->
<a href="#isolates-browser-data-field-virulence-genotypes">Virulence genotypes (<b><i>virulence_genotypes</i></b>)</a><br />
<a href="#isolates-browser-data-field-WGSAccession">WGS Accession (<b><i>wgs_master_acc</i></b>)+</a><br />
<a href="#isolates-browser-data-field-WGSPrefix">WGS Prefix (<b><i>wgs_acc_prefix</i></b>)+</a><br />
</td>
</tr>
</table>
<!-- ========= END_DATA_FIELDS_MINI_TOC ========= -->
</div>
<!-- ========= END_DATA_FIELDS_INTRO =========== -->
<!-- ========= DATA_FIELDS_DESCRIPTIONS =========== -->
<ul>
<!-- ======== DATA_FIELD_AMRGenotypes ========== -->
<li id="isolates-browser-data-field-AMRGenotypes">
<span style="background-color: #cde1ff">AMR genotypes (<b><i>AMR_genotypes</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Antimicrobial resistance (AMR) genes found in the isolate during analysis with <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. This is a de-duplicated list, so multiple genes that share the same symbol will only be represented once. <span style="color: #D3D3D3">&lt;NONE&gt;</span> indicates a lack of AMR genes identified by AMRFinderPlus, while an empty field means AMRFinderPlus results are not yet available. See the <a href="#isolates-browser-data-field-amrfinderplus-analysis-type">AMRFinderPlus analysis type</a>, <a href="#isolates-browser-data-field-refgene-db-version">PD Ref Gene Catalog version</a>, and <a href="#isolates-browser-data-field-amrfinderplus-version">AMRFinderPlus version</a> fields for more information about the AMRFinderPlus analysis of this isolate. <i>(Separate sections of this document provide an <a href="#amr-finder">overview of AMRFinderPlus</a> and additional information about <a href="#data-type-genotype">genotypes</a>.)</i><br /><br />
The genes that have been identified in an isolate's genome sequence are grouped into <b>genotype categories</b>, such as <i><b>complete</b></i>, <i><b>partial</b></i>, <i><b>partial end of contig</b></i>. The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section of this document provides <a href="/pathogens/docs/data_processing/#genotype-categories">more information about genotype categories</a>.<br /><br />
The <a href="#filters">Filters</a> interface has been customized for gene fields such as this one. See <a href="#filters-gene-fields">Filter gene fields</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes in the second example below), and the use of <a href="#wildcards">wildcards</a> such as the asterisk and question mark (as in the first and third examples below).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>AMR_genotypes:searchterm</i></li>
<li>Search for: &#160; <i>AMR_genotypes:mcr* AND AMR_genotypes:blaKPC*</i><br />
to show all of the isolates that have both a mobile colistin resistance gene and a KPC beta-lactamase.
</li>
<li>Search for: &#160; <i>AMR_genotypes:ant(6)-Ia AND AMR_genotypes:aph(3')-IIIa</i><br />
to show all of the isolates that have both strings, <i>ant(6)-Ia</i> and <i>aph(3')-IIIa</i>, in the AMR Genotypes data field.
</li>
<li>Search for: &#160; <i>AMR_genotypes:tet(*)</i><br />
to show all of the isolates that have a genotype of "tet(*)," with the asterisk serving as a <a href="#wildcards">wildcard</a> to retrieve gene names that have any characters in the parentheses, such as tet(A), tet(M), tet(O), tet(X), etc.
</li>
</ul>
<i>Note: To learn more about a given gene, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and search for the gene symbol of interest. For example, see the Reference Gene Catalog results of a search for
<a href="/pathogens/isolates#/refgene/mcr*">mcr*</a> or <a href="/pathogens/isolates#/refgene/ant(6)-Ia">ant(6)-Ia</a>. In the Pathogen Detection Reference Gene Catalog search results display, clicking on the gene symbol will retrieve the isolates that have been found to contain the gene.</i>
</li>
<!-- ======== DATA_FIELD_AMRGenotypesCore ========== -->
<li id="isolates-browser-data-field-AMRGenotypesCore">
<span style="background-color: #cde1ff">AMR genotypes core (<b><i>AMR_genotypes_core</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Core antimicrobial resistance (AMR) genes found in the isolate during analysis with <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. The only difference between the <span style="background-color: #cde1ff">AMR genotypes core (<b><i>AMR_genotypes_core</i></b>)</span> and <span style="background-color: #cde1ff">AMR genotypes (<b><i>AMR_genotypes</i></b>)</span> columns is that "plus" genes are not shown in the core column. This is a de-duplicated list, so multiple genes that share the same symbol will only be represented once. <span style="color: #D3D3D3">&lt;NONE&gt;</span> indicates a lack of AMR genes identified by AMRFinderPlus, while an empty field means AMRFinderPlus results are not yet available. See the <a href="#isolates-browser-data-field-amrfinderplus-analysis-type">AMRFinderPlus analysis type</a>, <a href="#isolates-browser-data-field-refgene-db-version">PD Ref Gene Catalog version</a>, and <a href="#isolates-browser-data-field-amrfinderplus-version">AMRFinderPlus version</a> fields for more information about the AMRFinderPlus analysis of this isolate. <i>(Separate sections of this document provide an <a href="#amr-finder">overview of AMRFinderPlus</a> and additional information about <a href="#refgene-scope">core vs. plus genotypes</a>.)</i><br /><br />
The <a href="#filters">Filters</a> interface has been customized for gene fields such as this one. See <a href="#filters-gene-fields">Filter gene fields</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk (as in the example below) and the question mark.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>AMR_genotypes_core:searchterm</i></li>
<li>Search for: &#160; <i>AMR_genotypes_core:mcr* AND AMR_genotypes_core:blaKPC*</i><br />
to show all of the isolates that have both a mobile colistin resistance gene and a KPC beta-lactamase.
</li>
</ul>
</li>
<!-- ======== DATA_FIELD_AMRFinderPlusAnalysisType ========== -->
<li id="isolates-browser-data-field-amrfinderplus-analysis-type">
<span style="background-color: #cde1ff">AMRFinderPlus analysis type (<b><i>amrfinderplus_analysis_type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Indicates the data types that were used to analyze the isolate's genome sequences using AMRFinderPlus. Genome sequences are generally analyzed in two passes: <br />
<ol>
<li><b>NUCLEOTIDE</b>: this is an initial analysis that is done, using translated BLAST, immediately after a pathogen isolate genome is assembled. It identifies the proteins in the genome sequence.</li>
<li><b>COMBINED</b>: this is a second, more sensitive analysis that runs AMRFinderPlus on both an isolate's nucleotide and protein sequences. Protein BLAST, nucleotide BLAST, and HMMER are used to analyze the proteins. The combined analysis can produce more sensitive results than the initial nucleotide analysis.<br />
<i>(Separate sections of this document provide details about the Pathogen Detection <a href="/pathogens/docs/data_processing">data processing pipeline</a> and an <a href="#amr-finder">overview of AMRFinderPlus</a>. The <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus wiki</a> provides details about installing and running the program, interpreting the results, and methods used.)</i>
</li>
</ol>
<!-- The "<i>amrfinderplus_analysis_type</i>" data field was added in February 2020. -->
This field will be empty if AMRFinderPlus results are not yet available.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below, and the values of "NUCLEOTIDE" and "COMBINED" must be written in <b>all upper case</b>. <!-- Additional <a href="#isolates-browser-query-tips">query tips</a> are provided in a separate section of this document. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk and question mark). --><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>amrfinderplus_analysis_type:searchterm</i></li>
<li>Search for: &#160; <i>amrfinderplus_analysis_type:COMBINED</i><br />
to show all of the isolates that were analyzed by running AMRFinderPlus on both their nucleotide and protein sequences.
</li>
</ul>
</li>
<!-- ======== DATA_FIELD_AMRFinderPlusVersion ========== -->
<li id="isolates-browser-data-field-amrfinderplus-version">
<span style="background-color: #cde1ff">AMRFinderPlus version (<b><i>amrfinderplus_version</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The version of the <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> software that was used to analyze a particular isolate.<br /><br />
New isolates are analyzed using the latest version of AMRFinderPlus software. Older isolates may have been analyzed with earlier versions of AMRFinderPlus software. There might be occasional updates to annotation on all isolates in special circumstances, such as the identification of new genes (e.g., mobilized colistin resistance (mcr) genes).<br /><br />
<!-- The "<i>amrfinderplus_version</i>" data field was added in February 2020. -->
This field will be empty if AMRFinderPlus results are not yet available.<br /><br />
<i>(Separate sections of this document provide details about the Pathogen Detection <a href="/pathogens/docs/data_processing">data processing pipeline</a> and an <a href="#amr-finder">overview of AMRFinderPlus</a>. The <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus wiki</a> provides details about installing and running the program, interpreting the results, and methods used.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a> (as shown in the example below, in which the data field name is in all lower case). Additional <a href="#isolates-browser-query-tips">query tips</a> are provided in a separate section of this document. <!-- Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk and question mark). --><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>amrfinderplus_version:searchterm</i></li>
<li>Search for: &#160; <i>amrfinderplus_version:3.6.7</i><br />
to show all of the isolates that were analyzed with AMRFinderPlus version 3.6.7.</li>
<!-- li><i>Note: The amrfinderplus_version data field was added in February 2020. As a result, isolates that were analyzed prior to that time do not have a value in the "AMRFinderPlus version" data column of the Isolates Browser display.</i></li -->
</ul>
</li>
<!-- ======== DATA_FIELD_Assembly ========== -->
<li id="isolates-browser-data-field-Assembly">
<span style="background-color: #cde1ff">Assembly (<b><i>asm_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The accession number for the genome sequence from the <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly database</a>.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br />
Note that a transient state may occur where two isolates point to the same assembly when the submitter changes the taxonomic identifier for the biosample from one taxgroup to another.
The assembly accession should be entered in the form of <b>Accession.version</b>, as in the first example below.<br />
If you enter only the accession, <b>no hits</b> will be returned.<br />
If you don't know the version number, then you can use an <b>asterisk</b> (<b>*</b>) to serve as a <b>wildcard</b>, as in the second example below.<br />
In either case, the letters that are in the <b>accession number prefix must be in upper case</b>. A separate section of this document provides search tips about <a href="#case-sensitive">case sensitive</a> searches.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_acc:searchterm</i></li>
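<li>Search for: &#160; <i>asm_acc:GCA_000008865.2</i></li>
<li>Search for: &#160; <i>asm_acc:GCA_000008865.*</i><br />
to retrieve the assembly regardless of its version number, with the asterisk serving as a <a href="#wildcards">wildcard</a>.</li>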
</ul>
</li>
<!-- ======== DATA_FIELD_ASTPhenotypes ========== -->
<li id="isolates-browser-data-field-ASTPhenotypes">
<span style="background-color: #cde1ff">AST phenotypes (<b><i>AST_phenotypes</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Antibiotic resistance phenotype, based on Antimicrobial Susceptibility Test (AST) results. <i>(<a href="#data-type-phenotype">read more about phenotypes</a> and look at sample records)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. A separate section of this document provides tips about the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a>.<br /><br />
<i>DISCLAIMER: Note that this data field is presented in the Isolates Browser as a list of antibiotic compounds broken down by the resistance call made by the data submitter. These calls are typically made using CLSI or EUCAST standards, and those standards change over time, OR the call is made by an automated instrument, which may infer the cutoff. This may mean that data submitted using an earlier standard may have different resistance calls for the same antibiotic compound than data submitted using a later standard, and even for the same organism and same isolate, different tests may yield different results. Users can search this field by the antibiotic compound AND by the resistance call &#8211; the format is different from that of most other fields in this document.</i><br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>AST_phenotypes:searchterm</i></li>
<li>Search for: &#160; <i>AST_phenotypes:imipenem=R</i><br />
to show isolates that are resistant to imipenem</li>
<li>Search for: &#160; &#160; <i>AST_phenotypes:ciprofloxacin=R OR AST_phenotypes:"nalidixic acid=R"</i><br />
to show isolates that are resistant to either ciprofloxacin or nalidixic acid</li>
</ul>
A list of possible <b>phenotype values</b> is shown on the <a href="https://www.ncbi.nlm.nih.gov/biosample/docs/beta-lactamase/">BioSample Antibiograms</a> page, under the "Resistance Phenotype" tab, and includes:<br />
<ul>
<li>intermediate (I)</li>
<li>nonsusceptible (NS)</li>
<li>not defined (N, ND)</li>
<li>resistant (R)</li>
<li>susceptible (S, sensitive)</li>
<li>susceptible-dose dependent (SDD)</li>
</ul>
</li>
<!-- ======== DATA_FIELD_BioProject ========== -->
<li id="isolates-browser-data-field-BioProject">
<span style="background-color: #cde1ff">BioProject (<b><i>bioproject_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
BioProject accession <i>(<a href="#data-type-bioproject">read more about bioprojects</a> and look at sample records)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>. The letters that are in the <b>accession prefix must be in upper case</b>, as shown in the example below. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>bioproject_acc:searchterm</i></li>
<li>Search for: &#160; <i>bioproject_acc:PRJNA230969</i><br />
to show all isolates that were sequenced as part of <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">BioProject PRJNA230969</a>, which describes the GenomeTrakr project by the US Food and Drug Administration (FDA) to sequence Escherichia coli (E. coli) genomes for the surveillance and rapid detection of foodborne contamination events.</li>
<li>Note that some bioprojects are "parent" to other bioprojects, and a search of this data field only retrieves the bioprojects that are being searched for explicitly. For example, the search above will only retrieve <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">BioProject PRJNA230969</a>, and not its parent project (BioProject PRJNA230919). To access a parent project, or additional sub-projects that fall under the same parent, follow the "Navigate up" and "Navigate Across" links, respectively, that appear on a BioProject page.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_BioSample ========== -->
<li id="isolates-browser-data-field-BioSample">
<span style="background-color: #cde1ff">BioSample (<b><i>biosample_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
BioSample accession <i>(<a href="#data-type-biosample">read more about biosamples</a> and look at sample records)</i>.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>. The letters that are in the <b>accession prefix must be in upper case</b>, as shown in the example below. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>biosample_acc:searchterm</i></li>
<li>Search for: &#160; <i>biosample_acc:SAMN05245394</i><br />
to show the isolate from an individual BioSample, <a href="https://www.ncbi.nlm.nih.gov/biosample/SAMN05245394">SAMN05245394</a>, which was collected and sequenced as part of the FDA's GenomeTrakr project (<a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">BioProject PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events</li>
</ul>
</li>
<!-- ======== DATA_FIELD_CollectedBy ========== -->
<li id="isolates-browser-data-field-CollectedBy">
<span style="background-color: #cde1ff">Collected by (<b><i>collected_by</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Name of persons or institute who collected the sample, if provided by the submitter.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below, and <a href="#query-tips-phrase-search-quotes">quotes can be used for phrase searches</a>.<br /><br />
When you enter a query, the system will retrieve isolates that contain the exact query string you specified, including punctuation, capitalization, and spaces.<br /><br />
To browse the various values that are available in a data field, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table, select the desired column (data field) to display, then click on the column header to sort by the values in that column.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>collected_by:searchterm</i></li>
<li>Search for: &#160; <i>collected_by:FDA</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_CollectionDate ========== -->
<li id="isolates-browser-data-field-CollectionDate">
<span style="background-color: #cde1ff">Collection Date (<b><i>collection_date</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Date sample was collected, in the format the submitter supplied.
<br /><i>(In contrast, the values in the <a href="#isolates-browser-data-field-CreateDate">Create Date</a> field are in ISO format.)</i><br /><br />
Note: collection_date is the time the sample was collected, which may differ from the time the data was submitted to <a href="http://www.insdc.org/">INSDC</a> and also from the time the data was added to the Pathogen Detection project. For real-time submissions of pathogen surveillance data, these dates will be in close proximity. For legacy data, or research projects, these dates may differ wildly and be separated by years.<br /><br />
You can use an <b>asterisk (*)</b> as a wildcard for truncation, in order to retrieve all of the isolates that were collected in a given month or year, as shown in the examples below.<br />
To search for a <b>range of values</b>, enter a query such as: collection_date:[value1 TO value2]
with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>collection_date:searchterm</i></li>
<li>Search for: &#160; <i>collection_date:2013-08-24</i><br />
to show isolates in which the submitter entered that exact string as the collection date.</li>
<li>Search for: &#160; <i>collection_date:2013-08</i><br />
to show isolates in which the submitter entered that exact string as the collection date (that is, the isolates in which the submitter provided only the year and month, but not the day, as the collection_date).</li>
<li>Search for: &#160; <i>collection_date:2013-08*</i><br />
to show isolates that were collected in August 2013. The asterisk serves as a <a href="#wildcards">wildcard</a>, and the system will therefore retrieve all isolates that have 2013-08 as the stem of their collection date.</li>
<li>Search for: &#160; <i>collection_date:[2013-02* TO 2013-08*]</i><br />to show isolates that were collected anytime from February 2013 through August 2013.</li>
</ul>
</li>
<!-- ====== Technical background notes for collection_date:
collection_date - is a free text field (not a true date field) that can contain date-formatted strings that are often written with the format YYYY-MM-DD, or written as a partial string such as YYYY or YYYY-MM. The collection_date field can also sometimes: (a) be empty (e.g., if a submitter didn't provide that information for their data), (b) contain a date format other than YYYY-MM-DD, (c) contain some other type of text string, if a submitter inserted something other than a date in that field. At no point is the value converted from free text to a date. Collection date is supposed to correspond to the date on which the sample (clinical or environmental/other) was taken, from which the pathogen was later isolated and sequenced. Because it is a free text field, an asterisk * can be used as a wildcard or for truncation.
====== End of Technical background notes for collection_date -->
<!-- ======== DATA_FIELD_ComputedTypes ========== -->
<li id="isolates-browser-data-field-ComputedTypes">
<span style="background-color: #cde1ff">Computed types (<b><i>computed_types</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
"In-silico" typing results. Currently the results of executing <a href="https://github.com/denglab/SeqSero2">SeqSero2</a> version 1.3.1 on Salmonella isolates (only) are presented in these subfields [<a href="#seqsero2_2015">Zhang 2015</a>, <a href="#seqsero2_2019">Zhang 2019</a>]:<br />
<ul>
<li><b>serotype</b> - The serovar computed from the reads (if available) or the assembly of the isolate.</li>
<li><b>antigen_formula</b> - The antigenic formula computed from the reads (if available) or the assembly of the isolate.</li>
</ul>
<br />
<b>Values for "Serotype" and "Antigen formula" in the <span style="background-color: #cde1ff">Computed types</span> field may not agree with the user submitted fields <a href="#isolates-browser-data-field-Serovar">Serovar</a>, <a href="#isolates-browser-data-field-TaxID">TaxID</a>, or <a href="#isolates-browser-data-field-ScientificName">Scientific name</a></b> because those fields are reported by the submitter. The "computed_types" field, on the other hand, is a computational prediction based on the sequence calculated as part of the Pathogen Detection Pipeline.
<br />
<br />
<b>Examples:</b>
<ul>
<li>Search for: &#160; <i>taxgroup_name:"Salmonella enterica" AND computed_types:serotype=Enteritidis</i><br />
to show isolates whose computed serovar is Enteritidis only.</li>
<li>Search for: &#160; <i>taxgroup_name:"Salmonella enterica" AND computed_types:antigen_formula=9:g,m:-</i><br />
to show isolates with the antigenic formula that corresponds to serovar Enteritidis.</li>
<li>Search for: &#160; <i>taxgroup_name:"Salmonella enterica" AND computed_types:serotype=Enteritidis AND NOT serovar:*nteritidis*</i><br />
to show isolates whose computed serovar is Enteritidis but were submitted with a different serovar.</li>
</ul>
</li>
<!-- ====== Technical background notes for computed_types:
computed_types - The values in the sub-fields are returned by the third-party tool and are not subject to validation by NCBI.
====== End of Technical background notes for computed_types -->
<!-- ======== DATA_FIELD_Contigs ========== -->
<li id="isolates-browser-data-field-Contigs">
<span style="background-color: #cde1ff">Contigs (<b><i>asm_stats_n_contig</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Number of contigs in the isolate's genome assembly. If this was submitted to GenBank by the submitter it will be from their assembly and will match the assembly stats in the assembly database (https://www.ncbi.nlm.nih.gov/assembly/). If it is from an assembly made by the Pathogen Detection system, it may not yet be in GenBank, and therefore this will be the only place to see the assembly statistics.<br /><br />
To search for a <b>range of values</b>, enter a query such as: &#160; <i>asm_stats_n_contig:[value1 TO value2]</i><br />with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>. An interesting way to use a range search of this field is to retrieve isolates whose genome assemblies are comprised of only a few contigs.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_stats_n_contig:searchterm</i></li>
<li>Search for: &#160; <i>asm_stats_n_contig:[1 TO 3]</i><br />
to retrieve isolates with genome assemblies comprised of contigs that range in number from 1 to 3</li>
</ul>
</li>
<!-- ======== DATA_FIELD_CreateDate ========== -->
<li id="isolates-browser-data-field-CreateDate">
<span style="background-color: #cde1ff">Create Date (<b><i>creation_date</i></b><!-- B><i>NOT target_creation_date</i></B -->)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The date on which this isolate was first seen by the Pathogen Detection system, in the format: YYYY-MM-DD. Note, these dates are in ISO format.<br /><i>(In contrast, the values in the <a href="#isolates-browser-data-field-CollectionDate">Collection Date</a> field are in the format that was provided by the data submitter.)</i><br /><br />
This data field does <b>not</b> accept an asterisk as a wild card. However, it allows you to input either a <b>full date or a partial date</b> as the query. For example, enter the query in the format:<br />
<div style="padding-left: 2em">
<b>YYYY-MM-DD</b> to retrieve all isolates first seen on a specific date, or<br />
<b>YYYY-MM</b> to retrieve all isolates first seen during a given month, or<br />
<b>YYYY</b> to retrieve all isolates first seen during a given year.<br />
</div>
To search for a <b>range of values</b>, enter a query such as: &#160; <i>creation_date:[value1 TO value2]</i><br />with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>creation_date:searchterm</i></li>
<li>Search for: &#160; <i>creation_date:2013-11-19</i><br />
to show isolates that were first seen by the Pathogen Detection system on that exact date.</li>
<li>Search for: &#160; <i>creation_date:2013-11</i><br />
to show isolates that were first seen by the Pathogen Detection system in November 2013.</li>
<li>Search for: &#160; <i>creation_date:2013</i><br />
to show isolates that were first seen by the Pathogen Detection system in 2013, regardless of the month or date.</li>
<li>Search for: &#160; <i>creation_date:[2013-02 TO 2013-08]</i><br />to show isolates that were first seen by the Pathogen Detection system anytime from February 2013 through August 2013.</li>
<li>Search for: &#160; <i>creation_date:[2013 TO 2015]</i><br />
to show isolates that were first seen by the Pathogen Detection system in any month or date from 2013 through 2015.</li>
</ul>
</li>
<!-- ====== Technical background notes for creation_date:
creation_date - is a true date and time field that Lewis created from the target creation date. It is a copy of the target creation date field, but it is a RANGE date and time field, not a POINT date and time field. As a result, it can be searched with a partial string. That is, the user does not need to enter the complete YYYY-MM-DDTHH:MM:SSZ string in the query. Instead, s/he can enter only part of the string, and the Isolates Browser will convert the user's query string into a range between two POINTS.
For example, if a user enters the query as:
2018-01-15
the system will convert that query to the range:
[2018-01-15T00:00:01Z TO 2018-01-15T23:59:59Z]
The creation_date field also allows users to do a range search, for example:
creation_date:[2013-11-01 TO 2013-11-30]
or
creation_date:[2013-08 TO 2013-11]
or
creation_date:[2013 TO 2015]
The creation_date field DOES NOT ALLOW USERS TO USE AN ASTERISK for truncation, for example:
creation_date:2013-11*
will retrieve ZERO ISOLATES. Instead, users can enter part of the date string, such as YYYY-MM or YYYY to retrieve isolates first seen in a given month or year, respectively, or they can use a range, as shown in the examples above.
====== End of Technical background notes for creation_date -->
<!-- ====== Technical background notes for target_creation_date:
target_creation_date - this is a POINT date and time field; it includes both the date and the time (expressed as Zulu time or Greenwich Mean Time (GMT)). Even though the date is stamped as GMT, the date stamp actually reflects the Eastern time at which the collection was loaded into the Pathogen Detection project. It represents the date and time on which the Pathogen Detection project first saw the GENOME ASSEMBLY for the isolate. The beginning and end of the range have to be expressed as POINT TIMES with the full string YYYY-MM-DDTHH:MM:SSZ. When a user is searching the target_creation_date field, the complete YYYY-MM-DDTHH:MM:SSZ string must be entered in the query.
CAUTION: If you insert a space after the datafieldname and colon (i.e., insert a space before the search term), then the system treats the query string as free text (and not a date). The system therefore looks in the Collection Date field because that field contains values that are text strings and not actual dates.
The "target_creation_date" field is not shown in this help document because it seems unlikely that users will know and/or search for the full string YYYY-MM-DDTHH:MM:SSZ. So only the "creation_date" field is shown in the help document, as it can be searched with YYYY-MM-DD, or YYYY-MM, or YYYY.
====== End of Technical background notes for target_creation_date -->
<!-- ======== DATA_FIELD_FoodOrigin ========== -->
<li id="isolates-browser-data-field-FoodOrigin">
<span style="background-color: #cde1ff">Food origin (<b><i>food_origin</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The geographical location where the sample originated, if provided by the submitter. This matches the /country qualifier of GenBank records. The data field typically may have two parts: <b>Country:Region</b>. <b>Country</b> is a <b>controlled vocabulary</b> (<a href="https://www.ncbi.nlm.nih.gov/genbank/collab/country/">https://www.ncbi.nlm.nih.gov/genbank/collab/country/</a>). <b>Region</b> is <b>not controlled</b> and can be anything (i.e., free text). For example, region could be a state abbreviation, province name, or city name.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. If you enter both Country and Region, surround the query string in quotes. If you only specify a country and no region,<!-- the retrieval will vary depending on whether you insert a <b>space</b> after "geo_loc_name:" If there is <b>no space</b>, --> then the search system will retrieve all isolates with the specified country name, regardless of region.<br /><br />
Note: use this field to indicate where the sample originated, not where it was collected.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>food_origin:searchterm</i></li>
<li>Search for: &#160; <i>food_origin:"USA:NY"</i><br />
with <b>quotes</b> around the "country:region" query string, to retrieve isolates that originated in New York State.</li>
<li>Search for: &#160; <i>food_origin:USA</i><br />
with <b>no space</b> before the country name, to retrieve isolates that originated in the United States, regardless of region.
<i>(If you insert a space before the country name, the system converts the query to a search of the Text index, which is a case insensitive compilation of terms from many text-containing data fields. It will therefore retrieve isolates that contain your search term (in upper and/or lower case) in any data field.)</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_Host ========== -->
<li id="isolates-browser-data-field-Host">
<span style="background-color: #cde1ff">Host (<b><i>host</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Host species, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters. Some submitters might have entered a <b>scientific name</b> while others might have entered a <b>common name</b>; therefore, search for <b>synonyms</b> if you would like to retrieve more comprehensive results.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below, and a separate section of this document provides tips about using <a href="#filters-synonyms">synonyms</a> in your query.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>host:searchterm</i></li>
<li>Search for: &#160; <i>host:"Homo sapiens"</i><br />
to retrieve only the isolates in which the submitter used the scientific name for the host species.</li>
<li>Search for: &#160; <i>host:human</i><br />
to retrieve only the isolates in which the submitter used the common name for the host species.</li>
<li>Search for: &#160; <i>host:"Homo sapiens" OR host:human</i><br />
to retrieve only the isolates in which the submitter used either the scientific name or the common name for the host species.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_HostDisease ========== -->
<li id="isolates-browser-data-field-HostDisease">
<span style="background-color: #cde1ff">Host Disease (<b><i>host_disease</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Host disease, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters. Search for synonyms if you would like to retrieve more comprehensive results.<br />
To browse the various values that are available in a data field, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table, select the desired column (data field) to display, then click on the column header to sort by the values in that column.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below, and separate sections of this document provide tips about using <a href="#filters-synonyms">synonyms</a> in your query, and <a href="#query-tips-phrase-search-quotes">using quotes for phrase searches</a>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>host_disease:searchterm</i></li>
<li>Search for: &#160; <i>host_disease:HUS</i></li>
<li>Search for: &#160; <i>host_disease:"hemolytic uremic syndrome"</i></li>
<li>Search for: &#160; <i>host_disease:"Hemolytic Uremic Syndrome"</i></li>
<li>Search for: &#160; <i>host_disease:HUS OR host_disease:"hemolytic uremic syndrome" OR host_disease:"Hemolytic Uremic Syndrome"</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_IFSAC_category ========== -->
<li id="isolates-browser-data-field-IFSAC_category">
<span style="background-color: #cde1ff">IFSAC_category (<b><i>IFSAC_category</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
IFSAC_category, if provided by the submitter.
The Interagency Food Safety Analytics Collaboration (IFSAC) develops regulatory-focused schemes to help categorize isolate sourcing information. <br /><br />
This field contains values exactly as they were entered by the data submitters. Search for synonyms if you would like to retrieve more comprehensive results.<br /><br />
To browse the various values that are available in a data field, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table, select the desired column (data field) to display, then click on the column header to sort by the values in that column.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below, and separate sections of this document provide tips about using <a href="#filters-synonyms">synonyms</a> in your query, and <a href="#query-tips-phrase-search-quotes">using quotes for phrase searches</a>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>IFSAC_category:searchterm</i></li>
<li>Search for: &#160; <i>IFSAC_category:nuts</i></li>
</ul>
<br />
An alternative way to search the <i>IFSAC_category</i> data field is to use the "<a href="#filters"><b>Filters</b></a>" option, which includes an <b>"IFSAC_category" text box</b>, where you can enter the category name. Here it is possible to search for null values by selecting <b>&lt;EMPTY&gt;</b>. <br /><br />
</li>
<!-- ======== DATA_FIELD_Isolate ========== -->
<li id="isolates-browser-data-field-Isolate">
<span style="background-color: #cde1ff">Isolate (<b><i>target_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Pathogen Detection accession of the isolate. The accession begins with the prefix "<b>PDT</b>," which stands for Pathogen Detection Target. This database is the primary resource issuing PDT accessions.<br /><br />
<b>Each target is the genome assembly for a single pathogen isolate</b>. There are <b>several types of genome assemblies</b>:<br />
<ol>
<li>isolate genomes assembled by the NCBI Pathogens <a href="/pathogens/docs/data_processing">data processing</a> pipeline from sequence reads, but not published as genome sequence records in GenBank</li>
<li>isolates submitted directly to GenBank as assembled genomes, and therefore have a corresponding <a href="#accession-prefix-gca">"GCA" accession</a></li>
<li>isolate genomes assembled by the NCBI data processing pipeline and then submitted to GenBank either by the submitter or on behalf of the submitter with their permission, or without their permission into the <a href="https://www.ncbi.nlm.nih.gov/genbank/tpa/">Third Party Annotation (TPA) database</a>.</li>
</ol>
<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, including in <a href="#filters-isolate">Filters</a>, and the letters that are in the <b>accession prefix must be in upper case</b>, as shown in the example below. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
The contents of this field may change for a given isolate if a new assembly or new metadata cause the pipeline to be rerun. See <a href="#data-retention">Data Retention and History Tracking</a> for information on the data retention policy.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>target_acc:searchterm</i></li>
<li>Search for: &#160; <i>target_acc:PDT000133982</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_Isolate_identifiers ========== -->
<li id="isolates-browser-data-field-Isolate_identifiers">
<span style="background-color: #cde1ff">Isolate_identifiers (<b><i>isolate_identifiers</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
A list of alternative identifiers that the isolate may be known by.<br /><br />
<b>Ids are assembled from various fields in the BioSample record, including</b>:<br />
<ol>
<li>auxiliary identifiers supplied with the BioSample</li>
<li>sample_name</li>
<li>strain</li>
<li>isolate (from BioSample)</li>
<li>NARMS_isolate_number</li>
<li>culture_collection</li>
<li>isolate_name_alias (split by delimiter)</li>
</ol>
<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a> and embedded spaces must be contained in quotes.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>isolate_identifiers:searchterm</i></li>
<li>Search for a specific identifier: CFSAN045463 <i>isolate_identifiers:CFSAN045463</i></li>
<li>Search for an identifier with embedded space: CVM N9107 <i>isolate_identifiers:"CVM N9107"</i></li>
<li>Search with a wildcard pattern: FSIS* <i>isolate_identifiers:FSIS*</i></li>
<li>Search a list <i>isolate_identifiers:(PNUSAS185147 PNUSAS185148 PNUSAS185149)</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_IsolationSource ========== -->
<li id="isolates-browser-data-field-IsolationSource">
<span style="background-color: #cde1ff">Isolation Source (<b><i>isolation_source</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Describes the physical, environmental and/or local geographical source of the biological sample from which the sample was derived, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters. Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. Separate sections of this document provide tips about the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a>, <a href="#special-characters">special characters</a> that are part of a query term, and the use of <a href="#wildcards">wildcards</a>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>isolation_source:searchterm</i></li>
<li>Search for: &#160; <i>isolation_source:lettuce</i></li>
<li>Search for: &#160; <i>isolation_source:"All-Purpose Flour"</i><br />
to show all isolates that have that exact string (including upper case, lower case, and hyphen) in the isolation source data field.</li>
<li>Search for: &#160; <i>isolation_source:*berry</i><br />
to show isolates that contain terms such as <i>strawberry</i>, <i>mulberry</i>, etc. in the isolation source data field, using the asterisk as a <a href="#wildcards">wildcard</a> to match zero or more sequential characters.</li>
<li>Note that submitters might use different terms for the same type of source (e.g., "animal-chicken-young-chicken," "chicken," "chicken breast," "Chicken Breast," "chicken carcass," "comminuted chicken," and "raw intact chicken"), so search for <a href="#synonyms">synonyms</a> to broaden your retrieval, if desired.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_IsolationType ========== -->
<li id="isolates-browser-data-field-IsolationType">
<span style="background-color: #cde1ff">Isolation type (<b><i>epi_type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Isolation type of an isolate: <b>clinical</b> OR <b>environmental/other</b> OR <b>NULL</b>.<br />
Note, this field is derived from the attribute package selected by the isolate's submitter using one of the Pathogen templates in BioSample.
<ul>
<li>If <b>attribute_package</b>=<a href="https://www.ncbi.nlm.nih.gov/biosample/docs/packages/Pathogen.cl.1.0">Pathogen.cl.1.0</a> then isolation type is <b>clinical</b>.</li>
<li>If <b>attribute_package</b>=<a href="https://www.ncbi.nlm.nih.gov/biosample/docs/packages/Pathogen.env.1.0">Pathogen.env.1.0</a> then isolation type is <b>environmental/other</b>,
unless host or isolation_source indicates that it was isolated from a human subject in which case isolation type is <b>clinical</b>.</li>
<li>If neither of these packages is used then isolation type is <b>NULL</b>.</li>
</ul>
<br />
The isolation type (epi_type) is used to calculate the SNP distance values
<a href="#isolates-browser-data-field-MinSame">Min-same</a> and <a href="#isolates-browser-data-field-MinDiff">Min-diff</a>.
These have non-negative values when there are other isolates in the cluster having the same or different isolation type.
These values will both be <b>n/a</b> if the isolate has isolation type <b>NULL</b>.
These values will also be <b>n/a</b> if there is no other isolate in the cluster having the same or different isolation type.
<br />
This data field's name and values are <a href="#case-sensitive">case sensitive</a>
and can be searched on values <b>clinical</b> OR <b>environmental/other</b> (enter as-is without quotes).
The value <b>NULL</b> cannot be used as a search term. However, by using filters,
you can choose between <b>clinical</b> OR <b>environmental/other</b> OR <b>&lt;EMPTY&gt;</b> and thereby find isolates whose <i>epi_type</i> is not set.
<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>epi_type:searchterm</i></li>
<li>Search for clinical isolates: &#160; <i>epi_type:clinical</i></li>
<li>Search for environmental isolates: &#160; <i>epi_type:environmental/other</i></li>
<li>Search for isolates without epi_type: &#160; <i>NOT epi_type:clinical NOT epi_type:environmental/other</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_KmerGroup ========== -->
<li id="isolates-browser-data-field-KmerGroup">
<span style="background-color: #cde1ff">K-mer group (<b><i>kmer_group</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
K-mer group accession, which is an alphanumeric representation of the <a href="#isolates-browser-data-field-OrganismGroup">Organism group</a>. This database is the primary resource issuing PDG accession numbers. There is a one-to-one relationship of the organism group and the PDG accession, with each version representing each update of that organism group.<br /><br />
The K-mer accession should be entered in the form of <b>Accession.version</b>, as in the first example below.<br />
If you enter only the accession, <b>no hits</b> will be returned.<br />
If you don't know the version number, then you can use an <b>asterisk</b> (<b>*</b>) to serve as a <b>wildcard</b>, as in the second example below.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the letters that are in the <b>accession prefix must be in upper case</b>, as shown in the examples below. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>kmer_group:searchterm</i></li>
<li>Search for: &#160; <i>kmer_group:PDG000000004.960</i></li>
<li>Search for: &#160; <i>kmer_group:PDG000000004.*</i><br />
with an asterisk (*) serving as a wildcard, if you don't know the version number of the K-mer accession.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_LatLon ========== -->
<li id="isolates-browser-data-field-LatLon">
<span style="background-color: #cde1ff">Lat/Lon (<b><i>lat_lon</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The geographical coordinates (latitude and longitude) of the location where the sample was collected, if provided by the submitter.
<!-- ul>
<li>To search this field directly, enter a query such as: &#160;
<i>____:searchterm</i></li>
<li>For example: &#160; <i>____:_____</i></li>
</ul><br -->
</li>
<!-- ======== DATA_FIELD_Length ========== -->
<li id="isolates-browser-data-field-Length">
<span style="background-color: #cde1ff">Length (<b><i>asm_stats_length_bp</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Total length of the genome sequence assembly in number of base pairs (nucleotides).<br />
If this was submitted to GenBank by the submitter it will be from their assembly and will match the assembly stats in the assembly database (https://www.ncbi.nlm.nih.gov/assembly/). If it is from an assembly made by the Pathogen Detection system, it may not yet be in GenBank, and therefore this will be the only place to see the assembly statistics.
<br /><br />
When searching the Length data field, the value should be entered as an <b>integer with no commas</b>.<br />
To search for a <b>range of values</b>, enter a query such as: &#160; <i>asm_stats_length_bp:[value1 TO value2]</i><br />
with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_stats_length_bp:[value1 TO value2]</i>
</li>
<li>Search for: &#160; <i>asm_stats_length_bp:[4000000 TO 5000000]</i><br />
to retrieve isolates with genome assemblies that are anywhere in the range of 4,000,000 to 5,000,000 nucleotides in length.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_Level ========== -->
<li id="isolates-browser-data-field-Level">
<span style="background-color: #cde1ff">Level (<b><i>asm_level</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Assembly level. <br /><br />
<!-- The following text is adapted from https://www.ncbi.nlm.nih.gov/assembly/help/ -->
The NCBI <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly database</a>, which includes pathogen isolates as well as eukaryotic organisms, represents genomes assembled to different levels <i>(<a href="https://www.ncbi.nlm.nih.gov/assembly/help/">read more about assembly levels</a>)</i>. This field is only present for those assemblies in the assembly database. For pathogen assemblies not yet submitted to GenBank, this field will be blank, but for all intents and purposes the Pathogen Detection assemblies will only be at contig level. The Isolates Browser uses circle icons to represent the assembly levels, as follows:<br /><br />
<ul>
<li><b>Complete Genome</b>: &#160; Complete genome assemblies, represented in the "Level" column as a <b>completely filled black circle</b> icon.<!-- I>Example: isolate accession number <a href="/pathogens/isolates#/search/target_acc:PDT000216052.3">PDT000216052.3</a></i --></li>
<!-- li><b>Chromosome</b>: &#160; Assemblies that include chromosomes or linkage groups, scaffolds, and contigs, represented in the "Level" column as a <b>3/4 filled circle</b> icon</li><br -->
<li><b>Scaffold</b>: &#160; Assemblies that include scaffolds and contigs, represented in the "Level" column as a <b>1/2 filled circle</b> icon.<!-- I>Example: isolate accession number <a href="/pathogens/isolates#/search/target_acc:PDT000333204.1">PDT000333204.1</a></i --></li>
<li><b>Contig</b>: &#160; Assemblies that include only contigs, represented in the "Level" column as a <b>1/4 filled circle</b> icon.<!-- I>Example: isolate accession number <a href="/pathogens/isolates#/search/target_acc:PDT000333205.1">PDT000333205.1</a></i --></li>
</ul>
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_level:"searchterm"</i></li>
<li>Search for: &#160; <i>asm_level:"Complete Genome"</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_LibraryLayout ========== -->
<li id="isolates-browser-data-field-LibraryLayout">
<span style="background-color: #cde1ff">Library Layout (<b><i>LibraryLayout</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Sequence Read Archive (SRA) library layout (PAIRED/SINGLE)<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>. The value for library layout must be entered in all upper case, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>LibraryLayout:searchterm</i></li>
<li>Search for: &#160; <i>LibraryLayout:PAIRED</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_Location ========== -->
<li id="isolates-browser-data-field-Location">
<span style="background-color: #cde1ff">Location (<b><i>geo_loc_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The geographical location where the sample was collected, if provided by the submitter. This matches the /country qualifier of GenBank records. The Location data field typically may have two parts: <b>Country:Region</b>. <b>Country</b> is a <b>controlled vocabulary</b> (<a href="https://www.ncbi.nlm.nih.gov/genbank/collab/country/">https://www.ncbi.nlm.nih.gov/genbank/collab/country/</a>). <b>Region</b> is <b>not controlled</b> and can be anything (i.e., free text). For example, region could be a state abbreviation, province name, city name, zip code, etc.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. If you enter both Country and Region, surround the query string in quotes. If you only specify a country and no region,<!-- the retrieval will vary depending on whether you insert a <b>space</b> after "geo_loc_name:" If there is <b>no space</b>, --> then the search system will retrieve all isolates with the specified country name, regardless of region.<br /><br />
Note: use this field to indicate from where the sample was collected, not where it originated.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>geo_loc_name:searchterm</i></li>
<li>Search for: &#160; <i>geo_loc_name:"USA:NY"</i><br />
with <b>quotes</b> around the "country:region" query string, to retrieve isolates that were collected in New York State.</li>
<li>Search for: &#160; <i>geo_loc_name:USA</i><br />
with <b>no space</b> before the country name, to retrieve isolates that were collected in the United States, regardless of region.<!-- retrieves 147,196 as of June 25, 2018 -->
<i>(If you insert a space before the country name, the system converts the query to a search of the Text index, which is a case insensitive compilation of terms from many text-containing data fields. It will therefore retrieve isolates that contain your search term (in upper and/or lower case) in any data field.)</i></li>
</ul>
</li>
<!-- ======== DATA_FIELD_Method ========== -->
<li id="isolates-browser-data-field-Method">
<span style="background-color: #cde1ff">Method (<b><i>assembly_method</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Assembly method.<br /><br />
This field contains values exactly as they were entered by the data submitters. <!-- The values in this column are the exact text strings that were provided by the data submitters for assembly method. --><br /><br />
When searching this field, the query string you enter must match exactly the string that appears in the "Method" column, including capitalization, punctuation, and spaces.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and <a href="#query-tips-phrase-search-quotes">quotes can be used for phrase searches</a>, as shown in the examples below.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>assembly_method:"search string in quotes"</i></li>
<li>Search for: &#160; <i>assembly_method:"CLC NGS Cell v. 9.0"</i></li>
<li>Search for: &#160; <i>assembly_method:"PacBio SMRT Analysis v. 2.3.0"</i></li>
<li>Search for: &#160; <i>assembly_method:"SPAdes v. 3.11.1"</i></li>
</ul><br />
</li>
<!-- ======== DATA_FIELD_MinSame ========== -->
<li id="isolates-browser-data-field-MinSame">
<span style="background-color: #cde1ff">Min-same (<b><i>minsame</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Minimum SNP distance from this isolate to one of the same <a href="#isolates-browser-data-field-IsolationType">isolation type</a>.
For example, the minimum SNP distance from one clinical isolate to another clinical isolate, or from one environmental isolate to another environmental isolate.<br /><br />
A value will appear in the "Min-same" column only if an isolate has been found, by the Pathogen Detection Project data processing pipeline, to belong to a SNP cluster and another isolate in that cluster has the same isolation type (and the isolation type is not NULL).
If it has, the isolate will contain a "PDS*" accession number in the "<a href="#isolates-browser-data-field-SNPCluster">SNP cluster</a>" column of the Isolates Browser,
along with a value in the "Min-same" and/or "<a href="#isolates-browser-data-field-MinDiff">Min-diff</a>" columns (depending upon the composition of the SNP cluster).<br /><br />
To view the SNP cluster for an isolate of interest, click on either the "PDT*" accession number in the "Isolate" column, or the "PDS*" accession number in the "SNP cluster" column.
In the SNP Tree Viewer display, the branch lengths are proportional to the number of SNPs among the isolates in the cluster. Mouse over any branch to see its length.<br /><br />
Note that the value of <b>Min-same</b> is <b>n/a</b> where the isolate does not have a value for <a href="#isolates-browser-data-field-IsolationType">isolation type</a>.
It is also <b>n/a</b> where there are no other isolates in the cluster with this isolate's <a href="#isolates-browser-data-field-IsolationType">isolation type</a>,
or if the isolate is not in any SNP cluster.<br /><br />
To search for a <b>range of values</b>, enter a query such as: &#160; <i>minsame:[value1 TO value2]</i> &#160;
with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>.
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>minsame:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>minsame:[0 TO 6]</i><br />
to retrieve isolates that are no more than 6 SNPs away from other isolates of the same isolation type within the same cluster.
In other words, retrieve clinical isolates that have a distance of no more than 6 SNPs from other clinical isolates in the same cluster, or retrieve environmental isolates that have a distance of no more than 6 SNPs from other environmental isolates in the same cluster.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_MinDiff ========== -->
<li id="isolates-browser-data-field-MinDiff">
<span style="background-color: #cde1ff">Min-diff (<b><i>mindiff</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Minimum SNP distance from this isolate to one of a different <a href="#isolates-browser-data-field-IsolationType">isolation type</a>.
For example, the minimum SNP distance from a clinical isolate to an environmental isolate, or vice versa.<br /><br />
A value will appear in the "Min-diff" column only if an isolate has been found, by the Pathogen Detection Project data processing pipeline, to belong to a SNP cluster and another isolate in that cluster has a different "Isolation type" that is not NULL.
If it has, the isolate will contain a "PDS*" accession number in the "<a href="#isolates-browser-data-field-SNPCluster">SNP cluster</a>" column of the Isolates Browser,
along with a value in the "Min-diff" and/or "<a href="#isolates-browser-data-field-MinSame">Min-same</a>" columns (depending upon the composition of the SNP cluster).<br /><br />
To view the SNP cluster for an isolate of interest, click on either the "PDT*" accession number in the "Isolate" column, or the "PDS*" accession number in the "SNP cluster" column.
In the SNP Tree Viewer display, the branch lengths are proportional to the number of SNPs among the isolates in the cluster. Mouse over any branch to see its length.<br /><br />
Note that the value of <b>Min-diff</b> is <b>n/a</b> where the isolate does not have a value for <a href="#isolates-browser-data-field-IsolationType">isolation type</a>.
It is also <b>n/a</b> where there are no other isolates in the cluster that have a type opposite to this isolate's <a href="#isolates-browser-data-field-IsolationType">isolation type</a>,
or if the isolate is not in any SNP cluster.<br /><br />
To search for a <b>range of values</b>, enter a query such as: &#160; <i>mindiff:[value1 TO value2]</i> &#160; with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>. Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>. Alternatively <a href="#filters">Filters</a> are a convenient way to search for ranges of values.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>mindiff:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>mindiff:[0 TO 6]</i><br />
to retrieve isolates that are no more than 6 SNPs away from other isolates of the opposite isolation type within the same cluster. In other words, retrieve clinical isolates that have a distance of no more than 6 SNPs from environmental isolates in the same cluster, or vice versa.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_N50 ========== -->
<li id="isolates-browser-data-field-N50">
<span style="background-color: #cde1ff">N50 (<b><i>asm_stats_contig_n50</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Assembly contig N50. This is a statistical measure that defines assembly quality. At least half of the bases in the assembly belong to contigs that have a length of N50 or longer.<br />
If this was submitted to GenBank by the submitter it will be from their assembly and will match the assembly stats in the assembly database (https://www.ncbi.nlm.nih.gov/assembly/). If it is from an assembly made by the Pathogen Detection system, it may not yet be in GenBank, and therefore this will be the only place to see the assembly statistics.<br /><br />
When searching the N50 data field, the value should be entered as an <b>integer with no commas</b>.<br />
To search for a <b>range of values</b>, enter a query such as: &#160; <i>asm_stats_contig_n50:[value1 TO value2]</i> &#160;
with <b>square brackets</b> surrounding the query string, and with the word <b>"TO" written in upper case</b>. Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this <b>data field name</b> should be written in all <b>lower case</b>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_stats_contig_n50:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>asm_stats_contig_n50:[1000000 TO 9999999]</i><br />
to retrieve isolates with genome assemblies that are highly aggregated (in this case 50% of the assembly length is in contigs 1 Mbp or greater in size).</li>
</ul>
</li>
<!-- ======== DATA_FIELD_OrganismGroup ========== -->
<li id="isolates-browser-data-field-OrganismGroup">
<span style="background-color: #cde1ff">Organism Group (<b><i>taxgroup_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Organism group related by taxonomy for purposes of calculating <a href="#isolates-browser-data-field-SNPCluster">SNP clusters</a><!-- from column header mousover text, 5/17/2018 -->.<br />
There is a one-to-one relationship between organism group and <a href="#accession-prefixes">PDG accession</a>. The organism group is effectively a shorthand for the organism that is predominant but does not list all organisms present. These organism groups are manually constructed and may include sister species and outgroups. To see the full list of organisms for each organism group, utilize the <a href="#isolates-browser-data-field-ScientificName">scientific_name</a> field.<br /><br />
Some organism groups are represented by the <i>Genus species</i> name, such as "<i>Listeria monocytogenes</i>," and others are represented as a phrase, such as "<i>E.coli and Shigella</i>."<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and <a href="#query-tips-phrase-search-quotes">quotes can be used for phrase searches</a>, as shown in the example below. The system will retrieve isolates that contain the exact organism group name that you entered, including capitalization, punctuation, and spaces.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>taxgroup_name:searchterm</i></li>
<li>Search for: &#160; <i>taxgroup_name:"Acinetobacter baumannii"</i></li>
</ul><br />
<b>Tips:</b><br />
Alternative ways to retrieve isolates that belong to a specific organism group include:<br />
<ul>
<li>Use the <b>"Select an organism group" menu</b> that appears near the top of the <a href="/pathogens/isolates#/search/">Isolates Browser</a> interface, OR</li>
<li>Open the complete list of <a href="/pathogens/organisms/">Organism Groups</a> and follow the links of interest to retrieve the isolates that belong to a group of interest.</li>
</ul>
<br />
<b>Technical note:</b><br />
<ul>
<li><i>An organism group (PDG) contains one or more targets (PDTs). A PDT is a member of zero or one SNP cluster (PDS), and never more than one cluster. A SNP cluster is composed of two or more PDTs, and each PDS is completely contained within a PDG. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)</i></li>
</ul>
<br />
</li>
<!-- ======== DATA_FIELD_Outbreak ========== -->
<li id="isolates-browser-data-field-Outbreak">
<span style="background-color: #cde1ff">Outbreak (<b><i>outbreak</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The submitter-designated name for an occurrence of more cases of disease than expected in a given area or among a specific group of people over a particular period of time, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters.<br /><br />
When searching this field, the query string you enter must match exactly the string that appears in the "Outbreak" column, including capitalization, punctuation, and spaces.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and <a href="#query-tips-phrase-search-quotes">quotes can be used for phrase searches</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>outbreak:"query string in quotes"</i></li>
<li>Search for: &#160; <i>outbreak:"1109COGX6-1 Cantaloupe"</i></li>
<li>Search for: &#160; <i>outbreak:"1203NYJAP-1"</i></li>
<li>To retrieve all isolates that have a value in the outbreak data field, enter a query that uses the asterisk (wildcard) as the value.<br /><br />
Search for: &#160; <i>outbreak:*</i><br /><br />
Once the search results are displayed, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table to add the "Outbreak" column to display, where you can browse the values that submitters entered in that data field.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_ParentGroup ========== -->
<!-- li id="isolates-browser-data-field-ParentGroup">
<span style="background-color: #cde1ff">Parent group (<b><i>parent_group</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
______________<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>____:searchterm</i></li>
<li>Search for: &#160; <i>____:_____</i></li>
</ul>
</li -->
<!-- ======== DATA_FIELD_PFGEPrimaryEnzymePattern ========== -->
<li id="isolates-browser-data-field-PFGEPrimaryEnzymePattern">
<span style="background-color: #cde1ff">PFGE Primary Enzyme Pattern (<b><i>PFGE_PrimaryEnzyme_pattern</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Pulsed-field gel electrophoresis (PFGE) primary enzyme pattern, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters. When searching this field, the query string you enter must match exactly the string that appears in the "PFGE Primary Enzyme Pattern" column, including capitalization and punctuation.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br /><br />
PFGE is a DNA fingerprinting technique used to differentiate bacterial strains based on the pattern of DNA fragments that are created by digesting their complete genome with a restriction enzyme. <i>(Read about PFGE on the <a href="https://www.cdc.gov/pulsenet/pathogens/pfge.html">CDC website</a> and in <a href="https://www.ncbi.nlm.nih.gov/pubmed?term=26894068+25682374+20692376">PubMed</a>.)</i><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>PFGE_PrimaryEnzyme_pattern:searchterm</i></li>
<li>Search for: &#160; <i>PFGE_PrimaryEnzyme_pattern:GX6A16.0016</i></li>
<li>Search for: &#160; <i>PFGE_PrimaryEnzyme_pattern:JFXX01.0787</i></li>
<li>To retrieve all isolates that have a value in the PFGE Primary Enzyme Pattern data field, enter a query that uses the asterisk (wildcard) as the value.<br /><br />
For example: &#160; <i>PFGE_PrimaryEnzyme_pattern:*</i><br /><br />
Once the search results are displayed, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table to add the "PFGE Primary Enzyme Pattern" column to display, where you can browse the values that submitters entered in that data field.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_PFGESecondaryEnzymePattern ========== -->
<li id="isolates-browser-data-field-PFGESecondaryEnzymePattern">
<span style="background-color: #cde1ff">PFGE Secondary Enzyme Pattern (<b><i>PFGE_SecondaryEnzyme_pattern</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Pulsed-field gel electrophoresis (PFGE) secondary enzyme pattern, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters. When searching this field, the query string you enter must match exactly the string that appears in the "PFGE Secondary Enzyme Pattern" column, including capitalization and punctuation.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br /><br />
PFGE is a DNA fingerprinting technique used to differentiate bacterial strains based on the pattern of DNA fragments that are created by digesting their complete genome with a restriction enzyme. <i>(Read about PFGE on the <a href="https://www.cdc.gov/pulsenet/pathogens/pfge.html">CDC website</a> and in <a href="https://www.ncbi.nlm.nih.gov/pubmed?term=26894068+25682374+20692376">PubMed</a>.)</i><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>PFGE_SecondaryEnzyme_pattern:searchterm</i></li>
<li>Search for: &#160; <i>PFGE_SecondaryEnzyme_pattern:EXHA26.0556</i></li>
<li>Search for: &#160; <i>PFGE_SecondaryEnzyme_pattern:GX6A12.0022</i></li>
<li>To retrieve all isolates that have a value in the PFGE Secondary Enzyme Pattern data field, enter a query that uses the asterisk (wildcard) as the value.<br /><br />
Search for: &#160; <i>PFGE_SecondaryEnzyme_pattern:*</i><br /><br />
Once the search results are displayed, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table to add the "PFGE Secondary Enzyme Pattern" column to display, where you can browse the values that submitters entered in that data field.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_Platform ========== -->
<li id="isolates-browser-data-field-Platform">
<span style="background-color: #cde1ff">Platform (<b><i>Platform</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Sequence Read Archive (SRA) sequencing platform.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>. The data field name, "Platform," should be written with a leading upper case letter, and the values are also case sensitive, as shown in the examples below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>Platform:searchterm</i></li>
<li>Search for: &#160; <i>Platform:ILLUMINA</i></li>
</ul>
<br />
<b>List of supported platforms:</b>
<ul>
<li>ILLUMINA</li>
<li>LS454</li>
<li>ION_TORRENT</li>
</ul>
<br />
</li>
<!-- ======== DATA_FIELD_PDRefGeneCatalogVersion ========== -->
<li id="isolates-browser-data-field-refgene-db-version">
<span style="background-color: #cde1ff">PD Ref Gene Catalog version (<b><i>refgene_db_version</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The version of the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> that was used to analyze a particular isolate.<br /><br />
New isolates are analyzed using the latest version of the Pathogen Detection Reference Gene Catalog. Older isolates may have been analyzed with earlier versions of the Pathogen Detection Reference Gene Catalog. There might be occasional updates to annotation on all isolates in special circumstances, such as the identification of new genes (e.g., mobilized colistin resistance (mcr) genes).<br /><br />
Because the "<i>refgene_db_version</i>" data field was added in February 2020, isolates that were analyzed prior to that time do not have a value in the corresponding "PD Ref Gene Catalog version" data column of the Isolates Browser display.<br /><br />
<i>(Separate sections of this document provide details about the Pathogen Detection <a href="/pathogens/docs/data_processing">data processing pipeline</a>, <a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog help</a>, and an <a href="#amr-finder">overview of AMRFinderPlus</a> that applies the Reference Gene Catalog data in the analysis of isolate genome assemblies. The <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus wiki</a> provides details about installing and running the program, interpreting the results, and methods used.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the hyphens in the examples below), and the use of <a href="#wildcards">wildcards</a> such as the asterisk and question mark.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>refgene_db_version:searchterm</i></li>
<li>Search for: &#160; <i>refgene_db_version:2020-01-06.1</i><br />
to show all of the isolates that were analyzed with the Pathogen Detection Reference Gene Catalog version 2020-01-06.1.
</li>
<li>Search for: &#160; <i>refgene_db_version:2020-01-22.1</i><br />
to show all of the isolates that were analyzed with the Pathogen Detection Reference Gene Catalog version 2020-01-22.1.
</li>
</ul>
</li>
<!-- ======== DATA_FIELD_Run ========== -->
<li id="isolates-browser-data-field-Run">
<span style="background-color: #cde1ff">Run (<b><i>Run</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Sequence Read Archive (SRA) accession of the sequence that was used for the genome assembly.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>. The data field name, "Run," should be written with a leading upper case letter, and the "SRR" accession prefix should be written in all upper case, as shown in the examples below. (A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>Run:searchterm</i></li>
<li>Search for: &#160; <i>Run:SRR3747659</i></li>
<li>Search for: &#160; <i>Run:SRR5862473 OR SRR7456389</i></li>
</ul><br />
</li>
<!-- ======== DATA_FIELD_Strain ========== -->
<li id="isolates-browser-data-field-Strain">
<span style="background-color: #cde1ff">Strain (<b><i>strain</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Microbial strain name, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br /><br />
Separate sections of this document provide tips about the use of <a href="#query-tips-special-characters">special characters</a> such as the hyphen, <a href="#wildcards">wildcards</a> such as the asterisk, and the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a> (for strain names that contain spaces).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>strain:searchterm</i></li>
<li>Search for: &#160; <i>strain:FDA00010279</i></li>
<li>Search for: &#160; <i>strain:KCRI-598A</i></li>
<li>Search for: &#160; <i>strain:PNUSA*</i></li>
</ul><br />
</li>
<!-- ======== DATA_FIELD_Serovar ========== -->
<li id="isolates-browser-data-field-Serovar">
<span style="background-color: #cde1ff">Serovar (<b><i>serovar</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Combined field of sub-species, serotype, or serovar, if provided by the submitter.<br /><br />
This field contains values exactly as they were entered by the data submitters.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br /><br />
Separate sections of this document provide tips about the use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a>, and <a href="#query-tips-special-characters">special characters</a> that appear in the sub-species, serotype, or serovar names.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>serovar:searchterm</i></li>
<li>Search for: &#160; <i>serovar:"4,[5],12:b:-"</i></li>
<li>Search for: &#160; <i>serovar:"Shigella sonnei"</i></li>
<li>Search for: &#160; <i>serovar:Enteritidis</i></li>
</ul><br />
</li>
<!-- ======== DATA_FIELD_Serotype ========== -->
<!-- li id="isolates-browser-data-field-Serotype">
<span style="background-color: #cde1ff">Serotype (<b><i>serotype</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
______________<br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>____:searchterm</i></li>
<li>Search for: &#160; <i>____:_____</i></li>
</ul><br>
</li -->
<!-- ======== DATA_FIELD_SNPCluster ========== -->
<li id="isolates-browser-data-field-SNPCluster">
<span style="background-color: #cde1ff">SNP cluster (<b><i>erd_group</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Pathogen SNP cluster accession. A SNP cluster is a group of isolates whose genome assemblies are closely related, depending on the clustering methodology used (as noted in the <a href="/pathogens/docs/data_processing">data processing</a> section of this document).<br /><br />
The SNP cluster accession data field name is <b><i>erd_group</i></b>, in which "<b><i>ERD</i></b>" stands for <b>E</b>pidemiologically <b>R</b>elated <b>D</b>istance.<br /><br />
Each SNP cluster can be viewed as a phylogenetic distance tree in the SNP Tree Viewer. <i>(Read more in the <a href="#snp-tree-viewer">SNP Tree Viewer help document</a>, which includes an <a href="#snp-tree-viewer-access"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a> and an <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, including in <a href="#filters-snp-cluster">Filters</a>, as shown in the examples below.<br /><br />
The first sample search below includes an <b>accession.version</b> number. If you don't know the latest version number for a SNP cluster, you can use an <b>asterisk *</b> as a <a href="#wildcards"><b>wildcard</b></a>, as in the second example below. If you enter an <b>older version number</b> that has since been superseded by a newer version of the SNP cluster, the Isolates Browser will display a message that links to the <b>newer version</b>. The PDS version changes when the membership of a SNP cluster changes.<br /><br />
A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project, and the <a href="#data-retention">data retention and history tracking</a> section describes the use of <a href="#accession-version">accession.versions to track changes</a> to the data.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>erd_group:searchterm</i></li>
<li>Search for: &#160; <i>erd_group:PDS000003441.73</i><!-- 132 isolates in tree as of 7/3/2018; includes both clinical samples from stool and environmental samples from All-Purpose Flour --></li>
<li>Search for: &#160; <i>erd_group:PDS000003441.*</i><!-- 132 isolates in tree as of 7/3/2018; includes both clinical samples from stool and environmental samples from All-Purpose Flour --><br />
with an asterisk (*) serving as a wildcard, if you don't know the version number of the SNP cluster accession.</li>
<li>Note: Because the SNP cluster accession is unique, it is not necessary to include the data field name in searches. It is sufficient to just enter the SNP cluster accession, if desired. For example, the first search above can simply be entered as <i>PDS000003441.73</i> into the Isolates Browser, and the second search can be entered as <i>PDS000003441.*</i>.</li>
</ul>
Either one of the search examples above will retrieve isolates that belong to a SNP cluster associated with an E. coli and Shigella outbreak that was traced to All-Purpose Flour. In that tree, the short branches that connect clinical and environmental samples indicate a high degree of similarity in the genome sequences of those isolates. <i>(For more information about the All-Purpose Flour outbreak, see the section of this document on "<a href="#how-to-outbreak">How to identify the possible source of an outbreak</a>.")</i>
</li>
<!-- ======== DATA_FIELD_ScientificName ========== -->
<li id="isolates-browser-data-field-ScientificName">
<span style="background-color: #cde1ff">Scientific name (<b><i>scientific_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Scientific name (in <a href="https://www.ncbi.nlm.nih.gov/taxonomy">NCBI Taxonomy</a>) of the isolate from the submitter. The <a href="#filters">Filters</a> interface has been customized for this field to show the taxonomic hierarchy. See the <a href="#filters-scientific-name">Filters documentation</a> for details.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the genus name must begin with an upper case letter. For example, enter the scientific name for: <i>Escherichia coli</i>. The system will retrieve isolates that have the exact string you entered. An asterisk * can be used as a <a href="#wildcards">wildcard</a>, if desired.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>scientific_name:searchterm</i></li>
<li>Search for: &#160; <i>scientific_name:"Escherichia coli O157:H7"</i><br />
to retrieve the isolates containing that full, exact string as the scientific name</li>
<li>Search for: &#160; <i>scientific_name:"Escherichia coli"</i><br />to retrieve the isolates containing that exact string as the scientific name, with no additional characters.</li>
<li>Search for: &#160; <i>scientific_name:Escherichia*</i><br />
to retrieve the isolates containing Escherichia in the scientific name, followed by any other characters.</li>
</ul>
An alternative way to search the <i>scientific_name</i> data field is to use the "<a href="#filters"><b>Filters</b></a>" option, which includes a <b>"Scientific Name" text box</b>, where you can enter the genus name (or the full genus and species name) of the pathogen, with the first letter of the genus capitalized. An <b>autocomplete</b> function will list the <b>top 10 scientific names</b> (based on number of isolates for each one) that begin with the term you entered. If your organism of interest doesn't fall within the top 10, then you can search the <i>scientific_name</i> data field directly for the organism of interest, as shown in the examples above.<br /><br />
To retrieve all isolates that belong to a specific <a href="#isolates-browser-data-field-OrganismGroup">Organism group</a>, use the <b>"Select an organism group" menu</b> on the <a href="/pathogens/isolates#/search/">Isolates Browser</a> home page.
</li>
<!-- ======== DATA_FIELD_source_type ========== -->
<li id="isolates-browser-data-field-source_type">
<span style="background-color: #cde1ff">Source type (<b><i>source_type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The isolate source type. Possible values include <i>Food, Animal, Environmental, Human, Animal feed</i>.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this data field name should be written in all lower case, as shown in the example below.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>source_type:searchterm</i></li>
<li>Search for: &#160; <i>source_type:Food</i><br /> to retrieve isolates with source_type <i>Food</i>.</li>
</ul>
<br />
An alternative way to search the <i>source_type</i> data field is to use the "<a href="#filters"><b>Filters</b></a>" option, which includes a <b>"Source type" text box</b>, where you can enter the <i>source_type</i> string. Here it is possible to search for null values by selecting <b>&lt;EMPTY&gt;</b>.<br /><br />
</li>
<!-- ======== DATA_FIELD_SpeciesTaxID ========== -->
<li id="isolates-browser-data-field-SpeciesTaxID">
<span style="background-color: #cde1ff">Species TaxID (<b><i>species_taxid</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The <a href="https://www.ncbi.nlm.nih.gov/taxonomy">NCBI Taxonomy</a> identifier (<a href="https://www.ncbi.nlm.nih.gov/books/NBK21100/#A268">TaxID</a>) at the species level for this isolate.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and this data field name should be written in all lower case, as shown in the example below.<br /><br />
The TaxID number for a species can be obtained from the <a href="https://www.ncbi.nlm.nih.gov/taxonomy">NCBI Taxonomy</a> database. For example, search the database for <a href="https://www.ncbi.nlm.nih.gov/taxonomy/?term=escherichia+coli"><i>Escherichia coli</i></a>, then follow the link for that species name to open its Taxonomy Browser display, which shows a TaxID of 562.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>species_taxid:searchterm</i></li>
<li>Search for: &#160; <i>species_taxid:562</i><br />
to retrieve all isolates that belong to the species <i>Escherichia coli</i>.</li>
</ul>
</li>
<!-- ======== DATA_FIELD_SRACenter ========== -->
<li id="isolates-browser-data-field-SRACenter">
<span style="background-color: #cde1ff">SRA Center (<b><i>sra_center</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The name of the center that submitted the data to the Sequence Read Archive (SRA).<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below.<br /><br />
The system will retrieve isolates that contain the exact query string you specified, including punctuation, capitalization, and spaces.<br /><br />
Separate sections of this document provide tips about use of <a href="#query-tips-phrase-search-quotes">quotes for phrase searches</a> and <a href="#special-characters">special characters</a> (such as a hyphen) that are part of a query term.<br /><br />
To browse the various values that are available in a data field, use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the "Matched Isolates" table, select the desired column (data field) to display, then click on the column header to sort by the values in that column.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>sra_center:searchterm</i></li>
<li>Search for: &#160; <i>sra_center:EDLB-CDC</i></li>
<li>Search for: &#160; <i>sra_center:FDA</i></li>
</ul><br />
</li>
<!-- ======== DATA_FIELD_SRAReleaseDate ========== -->
<li id="isolates-browser-data-field-SRAReleaseDate">
<span style="background-color: #cde1ff">SRA Release Date (<b><i>sra_release_date</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Sequence Read Archive (SRA) release date.<br /><br />
</li>
<!-- ======== DATA_FIELD_Status ========== -->
<!-- li id="isolates-browser-data-field-Status">
<span style="background-color: #cde1ff">Status (<b><i>status</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
______________<br /><br />
Q, Note: This field no longer seems to be in the Isolates Browser. It was mentioned in the JSON file dated 20180503, but not in the more recent file, dated, 20180518<br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>____:searchterm</i></li>
<li>Search for: &#160; <i>____:_____</i></li>
</ul><br>
</li -->
<!-- ======== DATA_FIELD_StressGenotypes ========== -->
<li id="isolates-browser-data-field-stress-genotypes">
<span style="background-color: #cde1ff">Stress genotypes (<b><i>stress_genotypes</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Stress resistance genes found in the isolate during analysis with <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. These can include metal, biocide, and heat resistance genes. This is a de-duplicated list, so multiple genes that share the same symbol will only be represented once. <span style="color: #D3D3D3">&lt;NONE&gt;</span> indicates a lack of stress genes identified by AMRFinderPlus, while an empty field means AMRFinderPlus results are not yet available. See the <a href="#isolates-browser-data-field-amrfinderplus-analysis-type">AMRFinderPlus analysis type</a>, <a href="#isolates-browser-data-field-refgene-db-version">PD Ref Gene Catalog version</a>, and <a href="#isolates-browser-data-field-amrfinderplus-version">AMRFinderPlus version</a> fields for more information about the AMRFinderPlus analysis of this isolate. <i>(Separate sections of this document provide an <a href="#amr-finder">overview of AMRFinderPlus</a>)</i><br /><br />
The genes that have been identified in an isolate's genome sequence are grouped into <b>genotype categories</b>, such as <i><b>complete</b></i>, <i><b>partial</b></i>, <i><b>partial end of contig</b></i>. The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section of this document provides <a href="/pathogens/docs/data_processing/#genotype-categories">more information about genotype categories</a>.<br /><br />
The <a href="#filters">Filters</a> interface has been customized for fields that have genes listed such as this one. See <a href="#filters-gene-fields">Filter gene fields</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. <!-- Additional <a href="#isolates-browser-query-tips">query tips</a> are provided in a separate section of this document. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk and question mark). --><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>stress_genotypes:searchterm</i></li>
<li>Search for: &#160; <i>stress_genotypes:emrE</i><br />
to show all of the isolates that have the emrE gene.
</li>
<li>Search for: &#160; <i>stress_genotypes:emrE AND stress_genotypes:merC</i><br />
to show all of the isolates that have both the emrE gene and the merC gene.
</li>
</ul>
<i>Note: To learn more about a given gene, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and search for the gene symbol of interest. For example, see the Reference Gene Catalog results of a search for
<a href="/pathogens/isolates#/refgene/emrE">emrE</a> or <a href="/pathogens/isolates#/refgene/merC">merC</a>. In the Pathogen Detection Reference Gene Catalog search results display, clicking on the gene symbol will retrieve the isolates that have been found to contain the gene.</i>
</li>
<!-- ======== DATA_FIELD_TaxID ========== -->
<li id="isolates-browser-data-field-TaxID">
<span style="background-color: #cde1ff">TaxID (<b><i>taxid</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The <a href="https://www.ncbi.nlm.nih.gov/taxonomy">NCBI Taxonomy</a> identifier (<a href="https://www.ncbi.nlm.nih.gov/books/NBK21100/#A268">TaxID</a>) for this isolate, which can have a classification that is narrower than species.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>taxid:searchterm</i></li>
<li>Search for: &#160; <i>taxid:83334</i><br />
to retrieve isolates for <i>Escherichia coli O157:H7</i>.
</li>
</ul>
<b>Notes:</b><br /><br />
<b>Compare</b> the TaxID data field that is described here with the "<a href="#isolates-browser-data-field-SpeciesTaxID">Species TaxID</a>" data field that was described earlier.<br />
The <b>Species TaxID</b> data field contains taxonomy IDs at the <i>Genus species</i> level.<br />
The <b>TaxID</b> data field, in contrast, can contain classifications that are <b>deeper</b> than species, as shown in the examples above.<br /><br />
The TaxID for a species and/or for deeper nodes can be obtained from the <a href="https://www.ncbi.nlm.nih.gov/taxonomy">NCBI Taxonomy</a> database. For example, search the database for <a href="https://www.ncbi.nlm.nih.gov/taxonomy/?term=escherichia+coli"><i>Escherichia coli</i></a>, then follow the link for that species name to open its Taxonomy Browser display, which shows the TaxID for the species and lists the strains that fall under it. Follow the link for any strain name of interest to open its Taxonomy Browser display and view its TaxID.
<br /><br />
Some isolates might contain the same value in both fields, such as the <i>E. coli</i> isolates that are retrieved by a search for:<br />
<i>species_taxid:562 AND taxid:562</i>.
Those isolates have just been classified at the Genus species level, and not any deeper.
</li><br />
<!-- ======== DATA_FIELD_VirulenceGenotypes ========== -->
<li id="isolates-browser-data-field-virulence-genotypes">
<span style="background-color: #cde1ff">Virulence genotypes (<b><i>virulence_genotypes</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Virulence genes found in the isolate during analysis with <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. This is a de-duplicated list, so multiple genes that share the same symbol will only be represented once. This field may also contain stx operon results, which represent the output of <a href="https://github.com/ncbi/stxtyper">StxTyper</a>, which is now included in <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> versions 4.0 and above. <span style="color: #D3D3D3">&lt;NONE&gt;</span> indicates a lack of virulence genes identified by AMRFinderPlus, while an empty field means AMRFinderPlus results are not yet available. See the <a href="#isolates-browser-data-field-amrfinderplus-analysis-type">AMRFinderPlus analysis type</a>, <a href="#isolates-browser-data-field-refgene-db-version">PD Ref Gene Catalog version</a>, and <a href="#isolates-browser-data-field-amrfinderplus-version">AMRFinderPlus version</a> fields for more information about the AMRFinderPlus analysis of this isolate. <i>(Separate sections of this document provide an <a href="#amr-finder">overview of AMRFinderPlus</a>)</i><br /><br />
The genes that have been identified in an isolate's genome sequence are grouped into <b>genotype categories</b>, such as <i><b>complete</b></i>, <i><b>partial</b></i>, <i><b>partial end of contig</b></i>. The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section of this document provides <a href="/pathogens/docs/data_processing/#genotype-categories">more information about genotype categories</a>.<br /><br />
<!-- i>(Separate sections of this document provide details about the Pathogen Detection <a href="/pathogens/docs/data_processing">data processing pipeline</a> and an <a href="#amr-finder">overview of AMRFinderPlus</a>.)</i><br /><br / -->
<!-- i>(<a href="#data-type-genotype">Read more about genotypes</a>, <a href="#/pathogens/docs/data_processing/genotype-categories">genotype categories</a>, and look at sample records.)</i><br /><br / -->
The <a href="#filters">Filters</a> interface has been customized for gene fields such as this one. See <a href="#filters-gene-fields">Filter gene fields</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, as shown in the examples below. <!-- Additional <a href="#isolates-browser-query-tips">query tips</a> are provided in a separate section of this document. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk and question mark). --><br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>virulence_genotypes:searchterm</i></li>
<li>Search for: &#160; <i>virulence_genotypes:fdeC</i><br />
to show all of the isolates that have the fdeC gene.
</li>
<li>Search for: &#160; <i>virulence_genotypes:fdeC AND virulence_genotypes:iroE</i><br />
to show all of the isolates that have both the fdeC gene and the iroE gene.
</li>
</ul>
<i>Note: To learn more about a given gene, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and search for the gene symbol of interest. For example, see the Reference Gene Catalog results of a search for
<a href="/pathogens/isolates#/refgene/fdeC">fdeC</a> or <a href="/pathogens/isolates#/refgene/iroE">iroE</a>. In the Pathogen Detection Reference Gene Catalog search results display, clicking on the gene symbol will retrieve the isolates that have been found to contain the gene.</i>
</li>
<!-- ======== DATA_FIELD_WGSAccession ========== -->
<li id="isolates-browser-data-field-WGSAccession">
<span style="background-color: #cde1ff">WGS Accession (<b><i>wgs_master_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The Whole Genome Shotgun (WGS) accession for the master record. The WGS master record contains no sequence data, and instead lists all of the accession numbers for the individual sequence records that compose the genome assembly for the isolate.<br /><br />
<b>Tips:</b><br />
The genome assembly identifier should be entered in the form of <b>Accession.version</b>, as in the first example below.<br />
If you enter only the accession, <b>no hits</b> will be returned.<br />
If you don't know the version number, then you can use an <b>asterisk</b> (<b>*</b>) to serve as a <a href="#wildcards"><b>wildcard</b></a>, as in the second example below.<br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the <b>accession prefix</b> must be in <b>upper case</b>, as shown in the examples below.<br /><br />
A separate section of this document provides a list of <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project, and the <a href="#data-retention">data retention and history tracking</a> section describes the use of <a href="#accession-version">accession.versions to track changes</a> to the data.<br /><br />
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>wgs_master_acc:searchterm</i></li>
<li>Search for: &#160; <i>wgs_master_acc:JZAA00000000.1</i></li>
<li>Search for: &#160; <i>wgs_master_acc:JZAA00000000.*</i><br />
with an asterisk (*) serving as a wildcard, if you don't know the version number of the WGS master record.<br />
<!-- Either query above will retrieve the Salmonellaisolate whose Whole Genome Shotgun (WGS) sequencing data is accessible from the WGS master record that has the accession number JZAA00000000.1. -->
</li>
</ul>
A separate page provides <a href="https://www.ncbi.nlm.nih.gov/genbank/wgs/">more information about WGS data</a>.
</li><br />
<!-- ======== DATA_FIELD_WGSPrefix ========== -->
<li id="isolates-browser-data-field-WGSPrefix">
<span style="background-color: #cde1ff">WGS Prefix (<b><i>wgs_acc_prefix</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The stable accession prefix that is assigned to a Whole Genome Shotgun (WGS) project.<br /><br />
<!-- Each Whole Genome Shotgun (WGS) project is assigned a stable 4-letter WGS accession prefix</b>, which does not change as the project is updated.<br /><br -->
<b>Examples:</b><br />
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>wgs_acc_prefix:searchterm</i></li>
<li>Search for: &#160; <i>wgs_acc_prefix:JZAA</i><br />
to retrieve the <!-- Salmonella -->isolate whose Whole Genome Shotgun (WGS) sequencing project was assigned the prefix JZAA.</li>
</ul>
<b>Background:</b>
A separate page provides <a href="https://www.ncbi.nlm.nih.gov/genbank/wgs/">more information about WGS data</a>.<br /><br />
<i>(<span style="background-color: #cde1ff"></span>
Go back up to <a href="#isolates-browser-data-fields">list of data fields</a> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#isolates-browser-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Isolates Browser data fields" /></a> or to <a href="#top">top of document</a> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a> )</i>
</li>
<!-- ======== END_OF_LAST_DATA_FIELD ========== -->
</ul>
<!-- ========= END_DATA_FIELDS_DESCRIPTIONS =========== -->
<!-- ========= END_DATA_FIELDS ======== -->
<!-- ========= SEARCH_MODIFIERS_DESCRIPTIONS =========== -->
<h3 id="isolates-browser-search-modifiers">Search modifiers <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<br />
Search modifiers can help limit the result set from an Isolates Browser search by specifying certain properties. <br />
<br />
<span id="isolates-browser-modifiers"><b>The available search modifiers in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> include the following:</b></span>
<br />
<ul>
<!-- ======== New ========== -->
<li id="isolates-browser-search-modifier-new">
<span style="background-color: #cde1ff">new </span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-search-modifiers"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser search modifiers" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
</li>
<ul>
An isolate is considered "new" when it was not included in the previous publication of the organism group. Most often a "new" isolate is represented by data newly deposited to NCBI, or added to the Pathogen Detection resource. But "new" also includes other, less common cases. These include cases in which an existing isolate was updated with new SRA data, an existing isolate was re-assembled, an isolate was dropped from Pathogen Detection and then added back (there can be many reasons for this, all uncommon), or the organism group is a new one in the Pathogen Detection system.
<br /><br />
<li><b>Example:</b> Get all the isolates added to an organism group since the last publication. Valid values are 0 and 1:
<a href="https://www.ncbi.nlm.nih.gov/pathogens/isolates#/search/taxgroup_name:%22Streptococcus%20pyogenes%22%20AND%20new:1"><b>taxgroup_name:"Streptococcus pyogenes" AND new:1</b></a>
<br />
</li>
</ul>
</ul>
<!-- ========= SEARCH_DATA_MODIFIERS_DESCRIPTIONS =========== -->
<!-- =============== SOLR_QUERY_EXAMPLES ============= -->
<!-- =============== SOLR_QUERY_EXAMPLES_INTRO ============= -->
<!-- <div style='padding-left: 2em'> -->
<h3 id="solr-sample-searches">Examples of SOLR queries <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-advanced-search"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Advanced Search, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li><a href="#solr-sample-search-IsolationSourceAllPurposeFlour"><b>Isolation source:</b><br />
Show all isolates that have the exact phrase "All-Purpose Flour" in the isolation_source data field</a></li>
<li><a href="#solr-sample-search-LocationAndOrganismGroup"><b>Geographic location and organism group:</b><br />
Show all Salmonella isolates from the USA</a></li>
<li><a href="#solr-sample-search-GenotypesMcrAndBlakpc"><b>Genotypes: isolates that have specific genes:</b><br />
Show all of the isolates that have a mobile colistin resistance gene and a KPC beta-lactamase</a></li>
<li><a href="#solr-sample-search-PhenotypesCiproResistant"><b>Phenotypes: isolates that are resistant to a given antibiotic:</b><br />
Show all of the isolates that are resistant to ciprofloxacin</a></li>
<li><a href="#solr-sample-search-GenotypesAndPhenotypes"><b>Genotypes and phenotypes:</b></a><br />
<a href="#solr-sample-search-GenotypesNoBlakpcNoBlandmImipenemResistant"><b>Example 1: missing specific genes, resistant to antibiotic:</b><br />
Show all of the isolates that lack both a blaKPC and blaNDM carbapenemase but are resistant to imipenem</a><br />
<a href="#solr-sample-search-GenotypesBlakpcMeropenemSusceptible"><b>Example 2: has specific gene, susceptible to antibiotic:</b><br />
Show all of the isolates that have a blaKPC gene and are susceptible to meropenem</a><br />
<a href="#solr-sample-search-GenotypesQnrCiproResistant"><b>Example 3: has specific gene, resistant to either of two antibiotics:</b><br />Show all of the isolates that have a qnr gene and that are resistant to either ciprofloxacin or nalidixic acid</a>
</li>
<!-- li><a href="#solr-sample-search-GeneNameSpecialCharacters"><b>Genotypes: gene name with special characters:</b><br />
Show all of the isolates that have the gene aph(4)-Ia and a blaKPC carbapenemase</a></li><br -->
<li><a href="#solr-sample-search-WhereIsMyIsolate"><b>Where is my isolate?</b><br />
Retrieve your data by BioSample accession numbers or SRA Run accession numbers</a></li>
<li><a href="#solr-sample-search-BatchSearch"><b>Batch search with isolate identifiers that contain a hyphen:</b><br />
Input a list of isolate identifiers that contain special characters (hyphens)</a></li>
</ul>
<!-- </div> -->
<!-- ======== END_SOLR_QUERY_EXAMPLES_INTRO ======== -->
<!-- ========= HORIZONTAL_RULE ============ -->
<div style="padding-left: 2em">
<hr />
</div>
<!-- ======= END_HORIZONTAL_RULE ========== -->
<!-- ====== SOLR_SAMPLE_SEARCHES_AND_COMMENTS_TIPS ====== -->
<ul>
<!-- ====== SOLR_SAMPLE_SEARCH:DATA_FIELD_PHRASE_SEARCH ===== -->
<li id="solr-sample-search-IsolationSourceAllPurposeFlour">
<b>Isolation source:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Show all isolates that have the exact phrase "All-Purpose Flour" in the isolation_source data field:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/isolation_source:%22All-Purpose%20Flour%22"><b><i>isolation_source:"All-Purpose Flour"</i></b></a>
</span>
<br />
<div style="padding-left: 2em">
Comments/Tips:<br />
This query searches the "<a href="#isolates-browser-data-field-IsolationSource">Isolation Source</a>" <a href="#isolates-browser-data-fields">data field</a>.<br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters. If you are uncertain about whether to use upper case, lower case, or mixed case in your query string, then you can simply enter the query in any case, but do not include a data field specifier. For example:<br />
<a href="/pathogens/isolates#/search/%22all-purpose%20flour%22"><b><i>"all-purpose flour"</i></b></a><br />
That approach searches a general <b>Text index</b>, which is a case insensitive compilation of terms from many text-containing data fields.<br />
The <b>quotes</b> ensure that your query string will be searched as a phrase, as noted in the <a href="#isolates-browser-query-tips">query tips</a> section of the document.
</div>
</li>
<!-- ==== END_SOLR_SAMPLE_SEARCH:DATA_FIELD_PHRASE_SEARCH === -->
<!-- ====== SOLR_SAMPLE_SEARCH:GEOGRAPHIC_LOCATION_TAXONOMIC_GROUP ===== -->
<li id="solr-sample-search-LocationAndOrganismGroup">
<b>Geographic location and organism group:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Show all Salmonella isolates collected in the USA:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/geo_loc_name:USA%20AND%20taxgroup_name:%22Salmonella%20enterica%22"><b><i>geo_loc_name:USA AND taxgroup_name:"Salmonella enterica"</i></b></a>
</span>
<br />
<div style="padding-left: 2em">
Comments/Tips:<br />
This query searches the "<a href="#isolates-browser-data-field-Location">Location</a>" (<i>geo_loc_name</i>) and "<a href="#isolates-browser-data-field-OrganismGroup">Organism Group</a>" (<i>taxgroup_name</i>) <a href="#isolates-browser-data-fields">data fields</a>.<br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters. If you are uncertain about whether to use upper case, lower case, or mixed case in your query string, then you can simply enter the query in any case, but do not include a data field specifier. For example:<br />
<a href="/pathogens/isolates#/search/usa%20AND%20%22salmonella%20enterica%22"><i>usa AND "salmonella enterica"</i></a><br />
That approach searches a general Text index, which is a case insensitive compilation of terms from many text-containing data fields.<br />
The quotes around the species name force the terms to be searched as a phrase.
</div>
</li>
<!-- ====== END_SOLR_SAMPLE_SEARCH:GEOGRAPHIC_LOCATION_TAXONOMIC_GROUP ===== -->
<!-- ==== SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_mcr_AND_blaKPC ==== -->
<li id="solr-sample-search-GenotypesMcrAndBlakpc">
<b>Genotypes: isolates that have specific genes:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<span>
Show all of the isolates that have a mobile colistin resistance gene and a KPC beta-lactamase<!-- blaKPC carbapenemase -->:</span><br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AMR_genotypes:mcr*%20AND%20AMR_genotypes:blaKPC*"><b><i>AMR_genotypes:mcr* AND AMR_genotypes:blaKPC*</i></b></a>
</span>
<br />
<div style="padding-left: 2em">
Comments/Tips:<br />
This query searches the "<a href="#isolates-browser-data-field-AMRGenotypes">antimicrobial resistance (AMR) genotypes</a>" <a href="#isolates-browser-data-fields">data field</a> and uses the <a href="#operators">Boolean operator</a> "AND" to override the default "OR."<br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters. If you are uncertain about whether to use upper case, lower case, or mixed case in your query string, then you can simply enter the query in any case, but do not include a data field specifier. For example:<br />
<a href="/pathogens/isolates#/search/mcr*%20AND%20blakpc*"><i>mcr* AND blakpc*</i></a><br />
That approach searches a general Text index, which is a case insensitive compilation of terms from many text-containing data fields.<br />
The <b>asterisk</b> (<b>*</b>) is a <b>wildcard</b>, so the query matches any term that begins with the specified word stem.
</div>
</li>
<!-- ==== END_SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_mcr_AND_blaKPC ==== -->
<!-- ==== SOLR_SAMPLE_SEARCH:AST_PHENOTYPES_Cipro_Resistant ==== -->
<li id="solr-sample-search-PhenotypesCiproResistant">
<b>Phenotypes: antibiotic resistance:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Show all of the isolates that are resistant to ciprofloxacin:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AST_phenotypes:ciprofloxacin=R"><b><i>AST_phenotypes:ciprofloxacin=R</i></b></a>
</span>
<br />
<div style="padding-left: 2em">
Comments/Tips:<br /><br />
The query directs the system to search the <a href="#isolates-browser-data-field-ASTPhenotypes">AST_phenotypes</a> data field, where the values can be:<br />
<ul>
<li>I (intermediate)</li>
<li>NS (nonsusceptible)</li>
<li>N, ND (not defined)</li>
<li>R (resistant)</li>
<li>S (susceptible, sensitive)</li>
<li>SSD (susceptible-dose dependent)</li>
</ul>
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters.<br /><br />
After you do the search, the Isolates Browser search results page will not display the "AST_phenotypes" column by default; however, you can use the "<a href="#isolates-browser-display-options">Choose Columns</a>" option at the top of the table to add that column to the display.
</div>
</li>
<!-- ==== END_SOLR_SAMPLE_SEARCH:AST_PHENOTYPES_Cipro_Resistant ==== -->
<!-- ===== SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_AND_AST_PHENOTYPES ===== -->
<li id="solr-sample-search-GenotypesAndPhenotypes">
<b>Genotypes and phenotypes:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<!-- ====== EXAMPLE_1: NO_blaKPC_AND_blaNDM_AND_resistant_to_imipenem ===== -->
<div style="padding-left: 2em">
<span id="solr-sample-search-GenotypesNoBlakpcNoBlandmImipenemResistant">
<b>Example 1: missing specific genes, resistant to antibiotic:</b></span><br /><br />
Show all of the isolates that lack both a blaKPC and blaNDM carbapenemase but are resistant to imipenem:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AST_phenotypes:imipenem=R%20AND%20NOT%20AMR_genotypes:blaKPC*%20AND%20NOT%20AMR_genotypes:blaNDM*"><b><i>AST_phenotypes:imipenem=R AND NOT AMR_genotypes:blaKPC* AND NOT AMR_genotypes:blaNDM*</i></b></a>
</span><br />
- or -<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AST_phenotypes:imipenem=R%20NOT%20AMR_genotypes:blaKPC*%20NOT%20AMR_genotypes:blaNDM*"><b><i>AST_phenotypes:imipenem=R NOT AMR_genotypes:blaKPC* NOT AMR_genotypes:blaNDM*</i></b></a>
</span>
</div>
<br /><br />
<!-- ===== END_EXAMPLE_1: NO_blaKPC_AND_blaNDM_AND_resistant_to_imipenem ===== -->
<!-- ==== EXAMPLE_2: HAS_blaKPC_AND_susceptible_to_meropenem ==== -->
<div style="padding-left: 2em">
<span id="solr-sample-search-GenotypesBlakpcMeropenemSusceptible">
<b>Example 2: has specific gene, susceptible to antibiotic:</b></span><br /><br />
Show all of the isolates that have a blaKPC gene and are susceptible to meropenem:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AST_phenotypes:meropenem=S%20AND%20AMR_genotypes:blaKPC*"><b><i>AST_phenotypes:meropenem=S AND AMR_genotypes:blaKPC*</i></b></a>
</span>
</div>
<br />
<!-- === END_EXAMPLE_2: HAS_blaKPC_AND_susceptible_to_meropenem === -->
<!-- ==== EXAMPLE_3: HAS_qnr_AND_resistant_to_either_cipro_or_nalixidic_acid ==== -->
<div style="padding-left: 2em">
<span id="solr-sample-search-GenotypesQnrCiproResistant">
<b>Example 3: has specific gene, resistant to either of two antibiotics:</b></span><br /><br />
Show all of the isolates that have a qnr gene and that are either ciprofloxacin or nalidixic acid resistant:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AMR_genotypes:qnr*%20AND%20(AST_phenotypes:ciprofloxacin=R%20OR%20AST_phenotypes:%22nalidixic%20acid=R%22)"><b><i>AMR_genotypes:qnr* AND (AST_phenotypes:ciprofloxacin=R OR AST_phenotypes:"nalidixic acid=R")</i></b></a>
</span>
</div>
<br />
<!-- === END_EXAMPLE_3: HAS_qnr_AND_resistant_to_either_cipro_or_nalixidic_acid === -->
<div style="padding-left: 2em">
Comments/Tips:<br />
This query searches the "<a href="#isolates-browser-data-field-AMRGenotypes">antimicrobial resistance (AMR) genotypes</a>" and "<a href="#isolates-browser-data-field-ASTPhenotypes">antibiotic susceptibility test (AST) Phenotypes</a>" <a href="#isolates-browser-data-fields">data fields</a>. It also uses the <a href="#operators">Boolean operators</a> "AND" and "NOT" to override the default "OR."<br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters. If you are uncertain about whether to use upper case, lower case, or mixed case in your query string, then you can simply enter the query in any case, but do not include a data field specifier. For example:<br />
<a href="/pathogens/isolates#/search/imipenem=r%20NOT%20blakpc*%20NOT%20blandm*"><i>imipenem=r NOT blakpc* NOT blandm*</i></a><br />
That approach searches a general Text index, which is a case insensitive compilation of terms from many text-containing data fields.<br />
The <b>asterisk</b> (<b>*</b>) is a <b>wild card</b> and therefore searches for the specified word stem.
</div>
</li>
<!-- ==== END_SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_AND_AST_PHENOTYPES ==== -->
<!-- ====== SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_aph(4)-Ia_AND_blaKPC ===== -->
<!-- li id="GeneNameSpecialCharacters">
<b>Genotypes: gene name with special characters:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Show all of the isolates that have the gene aph(4)-Ia and a blaKPC carbapenemase:<br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/AMR_genotypes:aph(4)-Ia%20AND%20AMR_genotypes:blaKPC*"><b><i>AMR_genotypes:aph(4)-Ia AND AMR_genotypes:blaKPC*</i></b></a>
</span>
<span style="background-color: #ffff00"><a href="______"><b><i>AMR_genotypes:aph\(4\)\-Ia AND AMR_genotypes:blaKPC*</i></b></a>
</span>
<br />
<div style='padding-left: 2em'>
Comments/Tips:<br />
This query searches the "<a href="#isolates-browser-data-field-AMRGenotypes">antimicrobial resistance (AMR) genotypes</a>" <a href="#isolates-browser-data-fields">data field</a> and includes a gene name that contains <a href="#special-characters"><b>special characters</b></a>. The Isolates Browser has been programmed to <b>automatically escape the special characters</b> when they are internal to a search term, such as the <b>parentheses</b> and <b>dash</b> that are <b>part of the gene name: <i>aph(4)-Ia</i></b>. The browser therefore interprets the special characters as part of the query string and returns isolates that contain the exact string you entered.<br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a> and reflect the values exactly as they were entered by the data submitters. If you are uncertain about whether to use upper case, lower case, or mixed case in your query string, then you can simply enter the query in any case, but do not include a data field specifier. For example:<br />
<a href="/pathogens/isolates#/search/aph(4)-ia%20AND%20blakpc*"><i>aph(4)-ia AND blakpc*</i></a><br />
That approach searches a general Text index, which is a case insensitive compilation of terms from many text-containing data fields.<br />
The <b>asterisk</b> (<b>*</b>) is a <b>wild card</b> and therefore searches for the specified word stem.
</div>
</li><br -->
<!-- ====== END_SOLR_SAMPLE_SEARCH:AMR_GENOTYPES_aph(4)-Ia_AND_blaKPC ===== -->
<!-- ====== SOLR_SAMPLE_SEARCH:WHERE_IS_MY_ISOLATE? ===== -->
<li id="solr-sample-search-WhereIsMyIsolate">
<b>Where is my isolate?</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
Retrieve your data by BioSample accession numbers or SRA Run accession numbers:<br />
<div style="padding-left: 2em">
<b>BioSample accession number</b> can be entered, with or without the "<a href="#isolates-browser-data-field-BioSample">BioSample</a>" <i>(biosample_acc)</i> <a href="#isolates-browser-data-fields">data field</a> specifier:<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/SAMN04605222"><b><i>SAMN04605222</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/biosample_acc:SAMN04605222"><b><i>biosample_acc:SAMN04605222</i></b></a></span><br />
</div>
<b>Sequence Read Archive (SRA) run</b> accession number can be entered, with or without the "<a href="#isolates-browser-data-field-Run">Run</a>" <i>(Run)</i> <a href="#isolates-browser-data-fields">data field</a> specifier. If the data field specifier is used, it must begin with an upper case letter "R":<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/SRR3986244"><b><i>SRR3986244</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/Run:SRR3986244"><b><i>Run:SRR3986244</i></b></a></span><br />
</div>
<b>List of BioSample accession numbers</b>, separated by white spaces, can be entered to retrieve multiple isolates, with or without the <a href="#isolates-browser-data-fields">data field</a> specifier:<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/SAMN04605222%20SAMN09061456"><b><i>SAMN04605222 SAMN09061456</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/biosample_acc:SAMN04605222%20SAMN09061456"><b><i>biosample_acc:SAMN04605222 SAMN09061456</i></b></a></span><br />
</div>
<b>List of SRA Run accession numbers</b>, separated by white spaces, can be entered, with or without the <a href="#isolates-browser-data-fields">data field</a> specifier. If the data field specifier is used, it must begin with an upper case letter "R":<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/SRR3986244%20SRR7294009%20SRR7294010%20SRR7293744%20SRR7293743"><b><i>SRR3986244 SRR7294009 SRR7294010 SRR7293744 SRR7293743</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/Run:SRR3986244%20SRR7294009%20SRR7294010%20SRR7293744%20SRR7293743"><b><i>Run:SRR3986244 SRR7294009 SRR7294010 SRR7293744 SRR7293743</i></b></a></span><br />
</div>
<b>Mixed list of BioSample and SRA Run accession numbers</b>, separated by white spaces, can be entered, with or without the <a href="#isolates-browser-data-fields">data field</a> specifiers, and without or with the Boolean OR:<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/SAMN04605222%20SRR7294010%20SRR7293743"><b><i>SAMN04605222 SRR7294010 SRR7293743</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/biosample_acc:SAMN04605222%20Run:SRR7294010%20SRR7293743"><b><i>biosample_acc:SAMN04605222 Run:SRR7294010 SRR7293743</i></b></a></span><br />
- or - <br />
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/biosample_acc:SAMN04605222%20OR%20Run:SRR7294010%20SRR7293743"><b><i>biosample_acc:SAMN04605222 OR Run:SRR7294010 SRR7293743</i></b></a></span>
</div>
</div>
</li>
<!-- ====== END_SOLR_SAMPLE_SEARCH:WHERE_IS_MY_ISOLATE? ===== -->
<!-- ====== SOLR_SAMPLE_SEARCH:BATCH_SEARCH_WITH_ISOLATE_IDENTIFIERS_THAT_CONTAIN_A_HYPHEN ===== -->
<li id="solr-sample-search-BatchSearch">
<b>Batch search with isolate identifiers that contain a hyphen:</b> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#solr-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of advanced sample searches" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Input a list of isolate identifiers that contain special characters (e.g., hyphens):<br />
<div style="padding-left: 2em">
<span style="background-color: #ffff00"><a href="/pathogens/isolates#/search/17B02879-2%2009B03887A-1%2009B01410A-1"><b><i>17B02879-2<br />
09B03887A-1<br />
09B01410A-1</i></b></a>
</span>
</div>
<br />
Comments/Tips:<br />
This query retrieves the list of isolates that have the specified identifiers. The Isolates Browser has been programmed to <b>automatically escape the special characters</b> when they are internal to a search term, such as the <b>dash</b> that is part of each identifier in the list. The browser therefore interprets the special characters as part of the query string and returns isolates that contain the exact string you entered.<br />
</li>
<!-- ====== END_SOLR_SAMPLE_SEARCH:BATCH_SEARCH_WITH_ISOLATE_IDENTIFIERS_THAT_CONTAIN_A_HYPHEN ===== -->
</ul>
<!-- ====== END_SOLR_SAMPLE_SEARCHES_AND_COMMENTS_TIPS ====== -->
<!-- ============= END_SOLR_QUERY_EXMAPLES =========== -->
<!-- =========== END_ISOLATES_BROWSER_ADVANCED_SEARCH ========== -->
<!-- ======== END_ISOLATES_BROWSER_INPUT ========= -->
<!-- ========= ISOLATES_BROWSER_OUPUT ============ -->
<h3 id="isolates-browser-output">Output from Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#isolates-browser-output-table">Tabular list of isolates</a> | <a href="#isolates-browser-exceptions-table">Exceptions table</a> | <a href="#isolates-browser-output-filters">Filters to refine results</a> | <a href="#isolates-browser-matched-clusters">Matched clusters</a> | <a href="#sort-order">Sort order</a><br />
<a href="#isolates-browser-display-options">Customize the display</a> (choose columns, default columns, additional columns)<br />
<a href="#isolates-browser-output-tree-viewer-link">SNP Tree Viewer link for each isolate that belongs to a SNP cluster</a><br />
<a href="#amr-genotypes-core-toggle">Show all AMR genotypes / Hide plus AMR genotypes button</a><br />
<a href="#isolates-browser-share">"<b>Share</b>" function in the Isolates Browser</a><br />
<a href="#isolates-browser-illustration"><span style="color:#d70000">Illustrated example</span> of Isolates Browser search results</a><br />
<a href="#isolates-browser-download">Download data from the Isolates Browser web display</a> (<a href="#isolates-browser-download-metadata">metadata</a>, <a href="#isolates-browser-download-assemblies">assemblies</a>)<br />
<a href="/pathogens/docs/isolates_gcp/">Isolates Browser in Google Cloud BigQuery</a><br />
</div>
<!-- ========= ISOLATES_BROWSER_OUPUT_TABLE ============ -->
<div style="padding-left: 2em">
<h4 id="isolates-browser-output-table">Tabular list of isolates <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>Upon opening the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, a table displays data for <b>all available isolates</b>, with the most recently added data at the top.</li>
<li><b>Every row</b> in the Isolates Browser is an <b>assembled isolate</b>, possibly with antimicrobial resistance (AMR), virulence, and/or stress response <a href="#data-type-genotype"><b>genotype data</b></a>, and antibiotic susceptibility (AST) <a href="#data-type-phenotype"><b>phenotype data</b></a>, as available.</li>
<li>The data for each isolate can also include strain name, geographic origin, isolation type (environmental or clinical), BioSample UID, K-mer group/organism group (PDG* accession), and more, as available. (See the <a href="#isolates-browser-data-fields">Pathogens Isolates Browser data fields</a> for a complete list.) Some of the data elements, such as accessions for corresponding BioSample and GenBank Assembly records, <b>link</b> to additional information in the <a href="#data-types">source databases</a>. The data in this table are either supplied by the submitter of the data into the BioProject, BioSample, SRA, and GenBank databases, and then collected from there by the Pathogen Detection system for display, or calculated by the Pathogen Detection system once the <a href="/pathogens/docs/data_processing">data is analyzed</a>.</li>
<li>The isolates can be <b>sorted</b> by clicking on column headers, <b>faceted</b> by using <a href="#filters">filters</a> (e.g., Property: has antimicrobial resistance (AMR) genotypes), or <b>searched</b> using <a href="#isolates-browser-basic-search">basic</a> or <a href="#isolates-browser-advanced-search">advanced</a> queries (see <a href="#solr-sample-searches">examples of SOLR queries</a> and an <a href="#isolates-browser-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>).</li>
<li><b>Tree Viewer links:</b> If an isolate has a "PDS*" accession number in the <b>"SNP Cluster" column</b>, that indicates it is part of a SNP cluster, and you can click on the PDS* accession to launch the <b>Tree Viewer</b> and examine the relationships among your isolate of interest and other closely related isolates. <i><a href="#isolates-browser-output-tree-viewer-link">read more...</a></i></li>
</ul>
</div>
<!-- ======== END_ISOLATES_BROWSER_OUPUT_TABLE ========= -->
<!-- ======== EXCEPTIONS_TABLE ========= -->
<div style="padding-left: 2em">
<h4 id="isolates-browser-exceptions-table">Exceptions table <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" />
<a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top">
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" />
</a>
</h4>
<ul>
<li>The results of a search for certain isolates in an organism group may include isolates that failed quality control (QC) and so are not used for analysis.
Isolates having "QC exceptions" are listed in an "Exceptions Table" along with QC details above the main grid display.
Users and submitters can find out why specific isolates are not being used.
</li>
<li>There are three "consequences" of QC failure:</li>
<ul>
<li><b>Not published</b> - The isolate will not appear in any published organism group (PDG).</li>
<li><b>Not clustered</b> - The isolate will appear in a published organism group (PDG) but will be presented as a singleton (i.e., no clustering attempted).</li>
<li><b>Not submitted</b> - The isolate will appear in a published organism group (PDG) and will be clustered, but its assembled sequence will not be submitted to GenBank.</li>
</ul>
<li>There are several exception "types":</li>
<ul>
<li><b>ANI species check</b> - When aligned against a database of type strains using average nucleotide identity (ANI) on the assembled sequence, the biosample's species could not be verified. </li>
<li><b>Readset validation failure</b> - The SRA run was not valid and could not be used for assembly.</li>
<li><b>Assembly validation failure</b> - The pathogen assembly was not valid and could not be used for analysis.</li>
<li><b>wgMLST validation failure</b> - The GenBank assembly could not be used for clustering.</li>
<li><b>Bad triples</b> - The assembly failed a triangle inequality test in the legacy kmer (i.e., non-wgMLST) clustering step.</li>
</ul>
<li>The Exceptions table is published to both the Pathogen Isolates Browser and FTP.
Further documentation about the ftp Exceptions file can be found at: <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">FTP README file.</a>
</li>
<li>Exception columns are defined as follows:</li>
<ul>
<li><b>exception type</b> - The category of error</li>
<li><b>exception</b> - Descriptive text for this category of error</li>
<li><b>consequence</b> - The result of the error</li>
<li><b>lower limit</b> - Lower allowed limit of the value if numeric</li>
<li><b>upper limit</b> - Expected value, or upper limit of value if numeric</li>
<li><b>actual value</b> - The value of the QC check for this isolate</li>
<li><b>BioSample</b> - BioSample accession</li>
<li><b>run(s)</b> - SRA accession for the sequencing run representing this isolate.</li>
<li><b>Isolate</b> - Pathogen target accession for this isolate</li>
<li><b>Assembly</b> - GenBank assembly accession for this isolate</li>
<li><b>organism</b> - Organism this isolate was submitted with</li>
<li><b>strain</b> - Strain this isolate was submitted with</li>
<li><b>sra center</b> - SRA center that submitted the sequencing run</li>
</ul>
<li>Click the download link to download the table in comma-delimited (.csv) or tab-delimited (.tsv) format.</li>
<li><b>Special note about assembly size validation</b>:
NCBI now validates the assembly size of most pathogenic bacterial organisms against fixed upper and lower bounds. These are set by species. The thresholds are the same for Pathogen and GenBank.
The assembly size thresholds can be checked by species; see
<a href="https://www.ncbi.nlm.nih.gov/assembly/help/genome-size-check">assembly size cutoffs</a>.
A table of min/max values is also available as a <a href="https://ftp.ncbi.nlm.nih.gov/genomes/ASSEMBLY_REPORTS/species_genome_size.txt.gz">downloadable TSV file</a>.
</li>
</ul></div>
<!-- ======== END_EXCEPTIONS_TABLE ========= -->
<!-- ========= ISOLATES_BROWSER_MATCHED_CLUSTERS ============ -->
<div style="padding-left: 2em">
<h4 id="isolates-browser-matched-clusters">Matched clusters <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" />
<a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top">
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" />
</a>
</h4>
<ul>
<li>The Matched clusters window displays clusters of isolates that contain at least one isolate from the search results. Each row represents a cluster that contains one or more isolates matching the search criteria. The criteria for clustering can be found <a href="/pathogens/docs/data_processing">here</a>.
</li>
<li>The Matched clusters columns are defined as follows:</li>
<ul>
<li><b>Organism groups</b>- Name of the organism group. For more information about organism groups, see <a href="#isolates-browser-data-field-OrganismGroup">here</a>.</li>
<li><b>SNP cluster</b>- The ID of the <a href="#accession-prefix-pds">PDS cluster</a> containing one or more of the isolates matching the search criteria. Clicking the hyperlink will open the cluster in the <a href="https://www.ncbi.nlm.nih.gov/pathogens/pathogens_help/#snp-tree-viewer">SNP Tree Viewer</a> with the isolates matching the search criteria highlighted in red.</li>
<li><b>Matched isolates</b>- The number of isolates in a given cluster that match the search criteria.</li>
<li><b>Matched clinical isolates</b>- The number of clinical isolates in a given cluster that match the search criteria. For a definition of clinical isolates, see <a href="#isolates-browser-data-field-IsolationType">here</a>.</li>
<li><b>Matched environmental isolates</b>- The number of environmental isolates in a given cluster that match the search criteria. For a definition of environmental isolates, see <a href="#isolates-browser-data-field-IsolationType">here</a>.</li>
<li><b>Total isolates</b>- The total number of isolates in a cluster. Since not all isolates are assigned an Isolation Type (clinical or environmental), the total number of isolates can be larger than the sum of the matched clinical and environmental isolates.</li>
<li><b>Minimal min-diff</b>- Within this cluster, the minimal number of SNPs between isolates having different <a href="#isolates-browser-data-field-IsolationType">isolation types</a>, provided such isolates exist in this cluster (e.g., environmental isolates within this cluster will differ by at least X SNPs from clinical isolates or vice versa).</li>
<li><b>Minimal min-same</b>- Within this cluster, the minimal number of SNPs between isolates having the same <a href="#isolates-browser-data-field-IsolationType">isolation type</a>, provided such isolates exist in this cluster (e.g., environmental isolates will differ by at least X SNPs from other environmental isolates or vice versa).</li>
<li><b>Latest update</b>- The date that particular cluster was last updated.</li>
</ul>
<li>For an example of the Matched clusters display, see <a href="#isolates-browser-illustration">the Illustrated example of Isolates Browser search results</a>.</li>
</ul></div>
<!-- ======== END_MATCHED_CLUSTERS ========= -->
<!-- ========= ISOLATES_BROWSER_OUPUT_FILTERS ============ -->
<div style="padding-left: 2em">
<h4 id="isolates-browser-output-filters">Filters to refine results <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The "Filters" menu options in the <a href="/pathogens/isolates#/search/">Isolates Browser</a> enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a <a href="#isolates-browser-basic-search">basic search</a> or an <a href="#isolates-browser-advanced-search">advanced search</a>.</li>
<li>By default, each filter displays the <b>top 100 terms</b> (based on the number of isolates retrieved by a term) listed by count of value within that set of top 100.</li>
<li>A separate section of this document provides <a href="#filters">additional information about Filters</a>, including descriptions of the <a href="#filters-menu">menu options</a>, a note that <a href="#filters-on-the-fly">filters are generated on the fly for a given data set</a>, and tips to <a href="#filters-synonyms">look for synonyms within a filter</a>.</li>
</ul>
</div>
<!-- ======== END_ISOLATES_BROWSER_OUPUT_FILTERS ========= -->
<!-- ========= ISOLATES_BROWSER_SORT_ORDER ============ -->
<div style="padding-left: 2em">
<h4 id="sort-order">Sort order <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li id="sort-order-lifo">The <b>default sort order</b> in the Isolates Browser is by Create Date (also known as <i>target_creation_date</i>). That is the date on which the isolate was first seen by the Pathogen Detection system. The isolates are shown in reverse chronological order, with the newest ones appearing at the top.</li>
<li id="sort-order-column-headers">To change the sort order, <b>click on a column header</b> to sort by that criterion.</li>
<li id="sort-order-example"><b>Example:</b><br />
<ul>
<li>Open the <a href="/pathogens/isolates#/search/">Isolates Browser</a> home page, which displays all available isolates in the default sort order.</li>
<li>Enter a search for <a href="/pathogens/isolates#/search/strawberr*"><i>strawberr*</i></a> &#160; (The asterisk is a <a href="#wildcards">wild card</a>. The system therefore searches for the word stem and will retrieve isolates that contain terms such as <i>strawberry</i>, <i>strawberries</i>, etc. in any data field.)</li>
<li>By <b>default</b>, the isolates are <b>sorted by Create Date</b>.</li>
<li>Click on the <i>"Organism" column header</i> to sort alphabetically by organism name.</li>
<li>Each subsequent click on the same <b>column header</b> inverts the sort order. (The column header acts as a <b>toggle switch</b> to sort in <b>ascending or descending order</b> by the values in that column.)</li>
<li><b>To return to</b> the original, <b>default sort order</b>, <b>refresh the page</b> (i.e., reload the Isolates Browser, or, if you have done a search, re-run the search).</li>
</ul>
</li>
</ul>
</div>
<!-- ======== END_ISOLATES_BROWSER_SORT_ORDER ========= -->
<!-- ========= ISOLATES_BROWSER_OUPUT_DISPLAY_OPTIONS ============ -->
<h3 id="isolates-browser-display-options">Customize the Isolates Browser display <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <a href="/pathogens/isolates#/search/">Isolates Browser</a> output table displays the default columns (highlighted in the <a href="#isolates-browser-data-fields-list">isolates browser column list</a>) initially, but you can use the "<b>Choose Columns</b>" option at the top of the "<b>Matched Isolates</b>" table to remove columns, select additional columns to display, and/or change the order of the columns. You can also drag column headers right and left to reorder them. Clicking on the column title will sort the list based on that column.<br /><br />
The options you select will <b>persist</b> within a given browser (e.g., Chrome, Edge, Internet Explorer, Firefox, Safari) until that browser's cookies are cleared/reset. To reset the column display and sort order to the default, click the <b>Choose columns</b> button, then click <b>Default</b> and <b>OK</b>.<br />
</div>
<!-- ======== END_ISOLATES_BROWSER_OUPUT_DISPLAY_OPTIONS ========= -->
<!-- ========= ISOLATES_BROWSER_OUPUT_TREE_VIEWER_LINK ============ -->
<h3 id="isolates-browser-output-tree-viewer-link">SNP Tree Viewer link for each isolate that belongs to a SNP cluster <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>If an isolate has a <b>"PDS*" accession number</b> in the <b>"SNP Cluster" column</b> of the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, this means the isolate's genome assembly has been found, via the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be closely related to other isolate genome sequences in that SNP cluster.
<!-- br />
<i>(The <a href="#sequence-data">sequence data analysis</a> section of this help document provides more information about the processing of isolate genome assemblies and the generation of <a href="#sequence-data-output">phylogenetic distance trees</a>.)</i --></li>
<li>Click on either the <b>"PDS*"</b> (Pathogen Detection SNP Cluster) accession number or the isolate's <b>"PDT*"</b> (Pathogen Detection Target) accession number to open the <a href="#snp-tree-viewer">SNP Tree Viewer</a>, which displays an interactive phylogenetic tree of all the isolates in the SNP cluster. <i>(A separate section of this document provides <a href="#snp-tree-viewer">more information about the SNP Tree Viewer</a>.)</i></li>
<li>If the SNP Cluster column is blank for a given isolate, that means the isolate's genome assembly has not been found, by the Pathogens <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to be similar to any other isolate that is <b>currently</b> in the Pathogen Detection Project.</li>
</ul>
<!-- ======== END_ISOLATES_BROWSER_OUPUT_TREE_VIEWER_LINK ========= -->
<!-- ======== AMR_GENOTYPES_CORE_TOGGLE ============ -->
<h3 id="amr-genotypes-core-toggle">Show all AMR genotypes / Hide plus AMR genotypes button<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li> A toggle button is shown to toggle display of the <b><a href="#isolates-browser-data-field-AMRGenotypesCore">AMR genotypes core</a></b> or <b><a href="#isolates-browser-data-field-AMRGenotypes">AMR genotypes</a></b> column when one and only one of the two columns is shown.</li>
</ul>
<!-- ======== END_AMR_GENOTYPES_CORE_TOGGLE ============ -->
<!-- ========= ISOLATES_BROWSER_SHARE_FUNCTION ============ -->
<h3 id="isolates-browser-share">"Share" function in the Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>A "<b>Share</b>" button is available in the Isolates Browser search results display. It produces a URL that captures your search strategy, which can then be copied and shared with others to execute the search. The results of the search, however, will change over time as new data become available.</li>
</ul>
<!-- ========= END_ISOLATES_BROWSER_SHARE_FUNCTION ============ -->
<!-- ========= ISOLATES_BROWSER_ILLUSTRATED_EXAMPLE ============ -->
<h3 id="isolates-browser-illustration">Illustrated example of Isolates Browser search results <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<a href="/pathogens/isolates#/search/escherichia%20AND%20(FDA%20CDC%20USDA)%20AND%20AST_phenotypes:*"><img src="/core/assets/pathogens/images/IsolatesBrowserResultsEcoliFdaCdcUsdaAndHaveASTPhenotypes.png" width="760" height="760" border="0" alt="Illustrated example of Pathogens Isolates Browser display, showing the results of a search for isolates that contain the terms escherichia, and FDA or CDC or USDA, and that have any value in the AST_phenotypes data field. The image shows the results as of July 24, 2018. Click on the image to open the current, live results for the search." /></a>
<ul>
<li>The illustration above shows the Pathogens Isolates Browser results (as of July 24, 2018) of a search for:<br />
<a href="/pathogens/isolates#/search/escherichia%20AND%20(FDA%20CDC%20USDA)%20AND%20AST_phenotypes:*">escherichia AND (FDA CDC USDA) AND AST_phenotypes:*</a><br />
That search retrieves isolates that contain the term "escherichia" in any data field, and contain the term FDA or CDC or USDA in any data field, and contain any value in the AST_phenotypes data field.</li>
<li>Click on the illustration, or enter the query above into the Isolates Browser, to open the current, live results for that search. Once the results are displayed, use the "<a href="#isolates-browser-display-options"><b>Choose Columns</b></a>" option to customize the display, for example, by adding the "<a href="#isolates-browser-data-field-ASTPhenotypes">AST Phenotypes</a>" column to the display.</li>
<li>The <a href="#isolates-browser">Isolates Browser help</a> section of this document provides additional information about searching, including <a href="#isolates-browser-basic-search">basic searches</a>, <a href="#isolates-browser-advanced-search">advanced searches</a>, available <a href="#isolates-browser-data-fields">data fields</a>, and additional <a href="#solr-sample-searches">examples of SOLR queries</a>.</li>
</ul>
<!-- ======== END_ISOLATES_BROWSER_ILLUSTRATED_EXAMPLE ========= -->
<!-- ========= ISOLATES_BROWSER_Display_in_microbigge ============ -->
<h3 id="isolates-browser-display-in-microbigge">Cross-browser selection - display isolates in MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>Selected isolates can be displayed in <a href="#microbigge">MicroBIGG-E</a>, the <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements which displays the results of <a href="#amr-finder">AMRFinderPlus</a> analyses.</li>
<li>It is possible to view the full results in <a href="#microbigge">MicroBIGG-E</a> for the isolates you have identified.</li>
<li>Click the <b>Cross-browser selection</b> button to the right of the Expand all button (you must be logged into your myNCBI account for this functionality). By default, all of the isolates from your Isolates Browser search will be selected, as indicated by the checkbox column; however, you can deselect rows manually.</li>
<li>Then click the <b>Show in MicroBIGG-E</b> button. A new tab will open with the MicroBIGG-E results for the selected isolates.</li>
<li>For example, having identified isolates that contain a blaKPC gene and a blaTEM-1 gene, a user might want to use <a href="#microbigge">MicroBIGG-E</a> to determine if these genes co-occur on the same contig. Having used the search term <a href="/pathogens/isolates#/search/AMR_genotypes:blaKPC*%20AND%20AMR_genotypes:blaTEM-1">AMR_genotypes:blaKPC* AND AMR_genotypes:blaTEM-1</a>, the user can click the Cross-browser selection button to the right of the Choose Columns button. By default, all of the isolates from your Isolates Browser search will be selected, as indicated by the checkbox column; however, you can deselect rows manually. Then the user can click the "Show in MicroBIGG-E" button. A new tab will open with the MicroBIGG-E results for the selected isolates.</li>
</ul>
<!-- ========= END_ISOLATES_Display_in_microbigge ============ -->
<!-- ======== END_ISOLATES_BROWSER_OUPUT ========= -->
<!-- ========= ISOLATES_BROWSER_AT_GCP ========= -->
<h3 id="isolates-browser-bigquery">Isolates Browser data at Google Cloud Platform in BigQuery <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
Isolates browser and exceptions information is available on Google Cloud in BigQuery. See the <a href="/pathogens/docs/getting_started_bigquery/">Getting Started with BigQuery</a> documentation for help getting started, and <a href="/pathogens/docs/isolates_gcp">Isolates Browser data at Google Cloud Platform</a> for details on the <code>isolates</code> and <code>isolate_exceptions</code> tables at Google BigQuery. From there the data can be analyzed and downloaded in bulk as well as linked to the <code>microbigge</code> table using SQL syntax.
</div>
<!-- ========= END_ISOLATES_BROWSER_AT_GCP ========= -->
<!-- ========= ISOLATES_BROWSER_DOWNLOAD_METADATA_OR_ASSEMBLIES ============ -->
<h3 id="isolates-browser-download">Download data from the Isolates Browser web display <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#isolates-browser-output"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Output, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <b>Download button</b> in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> allows you to download either the metadata or the assemblies for all of the genomes currently displayed by the Isolates Browser, as described below. Please note that <b>metadata</b> can be downloaded for any isolate, whether or not it has been submitted to GenBank. In contrast, <b>assemblies</b> can only be downloaded for isolates that have been submitted to GenBank (i.e., for isolates that display an accession in the <a href="#isolates-browser-data-field-Assembly">"Assembly" column</a>). For bulk SQL access to table data see <a href="/pathogens/docs/isolates_gcp/">Isolates Browser data at Google Cloud Platform</a>.
Note that we have a new option to download a list of accessions to facilitate use of the <a href="/datasets/docs/v2/download-and-install/">Datasets tool</a> which provides full genome data packages for any of the assemblies listed. See <a href="/pathogens/docs/datasets_assemblies/">Downloading with datasets</a> for more information.<br />
<ul>
<li id="isolates-browser-download-metadata"><b>Metadata</b><br />
<ul>
<li>Metadata <b>can be downloaded for any isolate</b>, whether or not it has been submitted to GenBank.</li>
<li>The Isolates Browser will download the <b>data that are currently displayed</b> into a <b>comma separated value (*.csv) file</b>.</li>
<li>For example, if you have chosen to <a href="#isolates-browser-display-options"><b>customize</b> the Isolates Browser display</a>, only the columns you have chosen to display will be downloaded into the file.</li>
<li>Bulk data in tab-delimited format per organism group can also be downloaded from the FTP site. See the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">ReadMe.txt</a> on the FTP site for more information.</li>
<li>To use SQL to query or to download &gt;100,000 rows see also <a href="/pathogens/docs/isolates_gcp/">Isolates Browser data at Google Cloud Platform</a>.</li>
</ul>
</li>
<li id="isolates-browser-download-assemblies"><b>Assemblies</b><br />
<ul>
<li>Assemblies <b>can only be downloaded for isolates that have been submitted to GenBank</b>:<!-- (i.e., <b>assemblies can only be downloaded for isolates that display an accession in the <a href="#isolates-browser-data-field-Assembly">"Assembly" column</a></b>, because assemblies that have been submitted to GenBank are also represented in the <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly Database</a>). -->
<ul>
<li>The <b><a href="#isolates-browser-data-field-Assembly">"Assembly" column</a> will display an accession</b> if an isolate's assembled genome sequence has been submitted to GenBank (because assemblies that have been submitted to GenBank are also represented in the <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly Database</a>).</li>
<li>The <b>Assembly column will be blank</b> if an isolate's genome sequence has not yet been submitted to GenBank. (The deposit of &gt;500,000 isolates from the Pathogens Project into the GenBank database is an ongoing project. Many, but not all, of the isolates have been submitted to GenBank. Once the data for a given isolate have been deposited into GenBank, an accession will appear in the Assembly column, and the genomic data will be available for download at that time.)</li>
</ul>
</li>
<li>Annotation data are downloaded as a <b>Generic Feature Format (GFF) file</b>. This is a tabular 9 column file that contains the annotations generated by the Assembly Database API. The <a href="https://www.ncbi.nlm.nih.gov/assembly/">Assembly Database</a> home page includes a link to the <a href="https://www.ncbi.nlm.nih.gov/genome/doc/ftpfaq/">Genomes Download FAQ</a>, which provides more information about data downloads.</li>
<li><img src="/pathogens/static/main/app/images/new.png" alt="New" />The <b>Assembly accessions</b> option allows you to download a list of assembly accessions that can be used with the <a href="https://www.ncbi.nlm.nih.gov/datasets/docs/v2/download-and-install/">Datasets command-line tool</a>. This tool is optimized to download assemblies in bulk. See our <a href="/pathogens/docs/datasets_assemblies/">Datasets downloads documentation</a> for more information.</li>
</ul>
</li>
</ul>
</div>
<!-- ====== END_ISOLATES_BROWSER_DOWNLOAD_METADATA_OR_ASSEMBLIES ====== -->
<!-- ########## END_H2_SECTION:ISOLATES_BROWSER ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:TREE_VIEWER ########## -->
<h2 id="snp-tree-viewer">SNP Tree Viewer help <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#snp-tree-viewer-what-is">What is the SNP Tree Viewer?</a><br />
<a href="#snp-tree-viewer-real-time-analysis">RealTimeAnalysis</a><br />
<a href="#snp-tree-viewer-access">How to access the SNP Tree Viewer</a> | <a href="#snp-tree-viewer-access-illustration"><span style="color:#d70000">Illustrated example</span> of SNP Tree Viewer launch points</a><br />
<a href="#snp-tree-viewer-scope-of-data">Scope of data in a tree</a><br />
<a href="#snp-tree-viewer-output"><b>Output</b>: Four panels in a SNP Tree Viewer display</a>:<br />
<div style='padding-left: 2em'>
<a href="#snp-tree-viewer-description"><span style="color:#d70000"><b>[A]</b></span> <b>Description of tree</b> (organism group and number of isolates)</a><br />
<a href="#snp-tree-viewer-isolates-selected"><span style="color:#d70000"><b>[B]</b></span> <b>Isolates selected</b> (navigation panel)</a><br />
<a href="#snp-tree-viewer-isolates-all"><span style="color:#d70000"><b>[C]</b></span> <b>Table of all isolates in tree</b></a><br />
<a href="#snp-tree-viewer-interactive-tree"><span style="color:#d70000"><b>[D]</b></span> <b>Interactive phylogenetic distance tree</b></a>
</div>
<a href="#snp-tree-viewer-controls"><b>SNP Tree Viewer display controls</b></a>|
<a href="#labels">Labels</a> |
<a href="#load-labels">Load Labels</a> |
<a href="#expand">Expand</a> |
<a href="#collapse">Collapse</a> |
<a href="#subtree">Subtree view</a> |
<a href="#neighbors">Neighbors</a> |
<a href="#search-in-tree">Search &amp; Highlight in Tree</a><br />
<a href="#share">"<b>Share</b>" function in the SNP Tree Viewer</a><br />
<a href="#snp-tree-viewer-illustration"><span style="color:#d70000">Illustrated example</span> of a SNP Tree Viewer display</a><br />
<a href="#automated-searches-watch">"<b>Watch</b>" function to receive automatic e-mail notifications about new data related to selected isolate(s)</a><br />
<a href="#automated-searches-watch-illustration"><span style="color:#d70000">Illustrated example</span> of automatic e-mail notification for a watched isolate</a><br />
</div -->
<ul>
<li><a href="#snp-tree-viewer-what-is">What is the SNP Tree Viewer?</a></li>
<li><a href="#snp-tree-viewer-real-time-analysis">Real time analysis</a></li>
<li><a href="#snp-tree-viewer-access">How to access</a>
<ul>
<li><a href="#snp-tree-viewer-access-illustration"><span style="color:#d70000">Illustrated example</span> of SNP Tree Viewer launch points</a></li>
</ul>
</li>
<li><a href="#snp-tree-viewer-scope-of-data"><b>Scope of data in a tree</b> (cutoffs for inclusion)</a></li>
<li><a href="#snp-tree-viewer-output"><b>Output: four panels in a SNP Tree Viewer display</b></a>
<ul>
<li><a href="#snp-tree-viewer-description"><span style="color:#d70000"><b>[A]</b></span> <b>Description of tree</b> (organism group and number of isolates)</a></li>
<li><a href="#snp-tree-viewer-isolates-selected"><span style="color:#d70000"><b>[B]</b></span> <b>Isolates selected</b> (navigation panel)</a></li>
<li><a href="#snp-tree-viewer-isolates-all"><span style="color:#d70000"><b>[C]</b></span> Table of <b>all isolates</b> in tree</a></li>
<li><a href="#snp-tree-viewer-interactive-tree"><span style="color:#d70000"><b>[D]</b></span> <b>Interactive phylogenetic distance tree</b></a>
<ul>
<li><a href="#snp-tree-viewer-controls">Tree Viewer display controls</a>
<ul>
<li><a href="#labels">Labels</a></li>
<li><a href="#load-labels">Load Labels</a></li>
<li><a href="#expand">Expand</a></li>
<li><a href="#collapse">Collapse</a></li>
<li><a href="#subtree">Subtree view</a></li>
<li><a href="#neighbors">Neighbors</a></li>
<li><a href="#search-in-tree">Search &amp; Highlight in Tree</a></li>
</ul>
</li>
</ul>
</li>
<li><a href="#neighbors">"<b>Neighbors</b>" function</a></li>
<li><a href="#search-in-tree">"<b>Search &amp; Highlight in Tree</b>"</a></li>
<li><a href="#share">"<b>Share</b>" function</a></li>
<li><a href="#snp-tree-viewer-illustration"><span style="color:#d70000">Illustrated example</span> of a SNP Tree Viewer display</a></li>
<li><a href="#automated-searches-watch">"<b>Watch</b>" function to receive automatic e-mail notifications about new data related to selected isolate(s)</a></li>
<li><a href="#automated-searches-watch-illustration"><span style="color:#d70000">Illustrated example</span> of an automatic notification for a watched isolate</a><br /></li>
</ul>
</li>
</ul>
<!-- ========= TREE_VIEWER_WHAT_IS ============ -->
<h3 id="snp-tree-viewer-what-is">What is the SNP Tree Viewer? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
For all pathogen isolates that are clustered together as part of the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, a phylogenetic tree is built for each cluster. The trees can be used to: (1) identify the possible source of an outbreak based on the sequence similarity of the clinical and environmental isolates in a tree, (2) select isolates of interest and examine their relationships to other isolates in the SNP cluster, or to each other, and (3) retrieve metadata about the pathogen isolate.<br /><br />
<i>The information below provides details on <a href="#snp-tree-viewer-real-time-analysis">real time analysis</a>, <a href="#snp-tree-viewer-access">how to access the SNP Tree Viewer</a>, <a href="#snp-tree-viewer-scope-of-data">scope of data in a tree</a> and <a href="#snp-tree-viewer-output">output (four panels in a tree viewer display)</a>, which include: <a href="#snp-tree-viewer-description">[A] description of tree (organism group and number of isolates)</a>, <a href="#snp-tree-viewer-isolates-selected">[B] isolates selected (navigation panel)</a>, <a href="#snp-tree-viewer-isolates-all">[C] table of all isolates in tree</a>, <a href="#snp-tree-viewer-interactive-tree">[D] interactive phylogenetic distance tree</a>.</i><br />
</div>
<!-- ======== END_TREE_VIEWER_WHAT_IS ========= -->
<!-- ========= TREE_VIEWER_REAL_TIME_ANALYSIS ============ -->
<h3 id="snp-tree-viewer-real-time-analysis">Real time analysis <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
Unlike other NCBI systems such as BLAST, the <a href="/pathogens/">Pathogen Detection</a> project is not built with an interactive interface that allows users to upload their data and immediately obtain an answer. Instead, this project was set up to facilitate interactive analyses of large-scale surveillance projects that are automatically submitting real-time data to the NCBI archives that are then routed to an automated pipeline that generates interactive web reports on a daily basis. The web displays allow users to search, browse, and filter the automatically analyzed data that have already been submitted.
</div>
<!-- ======== END_TREE_VIEWER_REAL_TIME_ANALYSIS ========= -->
<!-- ========= TREE_VIEWER_ACCESS ============ -->
<h3 id="snp-tree-viewer-access">How to access the SNP Tree Viewer <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The SNP Tree Viewer can be accessed from the <a href="/pathogens/isolates#/search/">Isolates Browser</a>.
<!-- The SNP Tree Viewer can be accessed either from the Isolates Browser, or by entering the URL of a previously viewed tree. --> Any isolate that has a <b>"PDS*" accession number</b> in the <b>"SNP Cluster" column</b> has a link to the SNP Tree Viewer. <i>("PDS" is the <a href="#accession-prefixes">accession number prefix</a> for a <b>P</b>athogen <b>D</b>etection <b>S</b>NP cluster.)</i><br /><br />
<b>Example:</b> The FDA's GenomeTrakr project (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/230969">PRJNA230969</a>) for the surveillance and rapid detection of foodborne contamination events includes a <a href="/pathogens/isolates#/search/PRJNA230969%20AND%20PDS000003441"><b>subset of <i>E. coli</i> isolates that belong to the SNP cluster "PDS000003441"</b></a>, and that were associated with a 2016 outbreak from all-purpose flour.<br /><br />
In the Isolates Browser display, you can <b>click on the "PDS*" accession number</b> that appears in the <b>"SNP Cluster" column</b> for any one of those isolates <!-- (e.g., isolate PDT000133982.1) --> to open the SNP Tree Viewer display for the SNP cluster and interactively examine the phylogenetic distance tree. (Below is an <a href="#snp-tree-viewer-access-illustration"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a>.)<br /><br />
The resulting SNP Tree View shows a number of <b>clinical and environmental samples that are very closely related</b>, and therefore sheds light on the possible source of the outbreak. The <a href="#snp-tree-viewer-output">SNP Tree Viewer output</a> section of this document includes an <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a> that includes isolates from the <i>E. coli</i> outbreak. <i>(<a href="https://www.cdc.gov/ecoli/2016/o121-06-16/index.html">Read more on the CDC website about that outbreak</a>.)</i>
<br /><br />
<img src="/core/assets/pathogens/images/IsolatesBrowserTreeViewerLaunchPoints.png" width="650" height="590" border="0" alt="Illustration of Pathogens Isolates Browser output, showing launch points for the SNP Tree Viewer. Each SNP cluster (PDS*) accession opens a SNP Tree Viewer display." id="snp-tree-viewer-access-illustration" />
</div>
<!-- ======== END_TREE_VIEWER_ACCESS ========= -->
<!-- ========= TREE_VIEWER_SCOPE_OF_DATA ============ -->
<h3 id="snp-tree-viewer-scope-of-data">Scope of data in a tree <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <a href="/pathogens/docs/data_processing">data processing pipeline</a> section describes what data is available in the SNP Tree Viewer.<br /><br />
Individual phylogenetic trees for each SNP cluster are available on <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP</a> as well as the NCBI Pathogen Detection <a href="/pathogens/isolates#/search/">Isolates Browser</a>.
<i>(Separate sections of this file provide <a href="#isolates-browser">Isolates Browser help documentation</a> and an <a href="#ftp">overview of the data available on the FTP site</a>.)</i>
</div>
<!-- ======== END_TREE_VIEWER_SCOPE_OF_DATA ========= -->
<!-- ========= TREE_VIEWER_OUTPUT_USER_INTERFACE ============ -->
<h3 id="snp-tree-viewer-output">Output: four panels in a SNP Tree Viewer display <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#snp-tree-viewer-description"><img src="/core/assets/pathogens/images/red_box_A.png" width="20" height="20" border="0" /> Description of tree (organism group and number of isolates)</a><br />
<a href="#snp-tree-viewer-isolates-selected"><img src="/core/assets/pathogens/images/red_box_B.png" width="20" height="20" border="0" /> Isolates selected (navigation panel)</a><br />
<a href="#snp-tree-viewer-isolates-all"><img src="/core/assets/pathogens/images/red_box_C.png" width="20" height="20" border="0" /> Table of all isolates in tree</a><br />
<a href="#snp-tree-viewer-interactive-tree"><img src="/core/assets/pathogens/images/red_box_D.png" width="20" height="20" border="0" /> Interactive phylogenetic distance tree</a><br />
<a href="#snp-tree-viewer-controls"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="20" border="0" /><b>Tree Viewer display controls</b>:</a><br />
<a href="#labels"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Labels</b></a><br />
<a href="#load-labels"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Load Labels</b></a><br />
<a href="#expand"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Expand</b></a><br />
<a href="#collapse"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Collapse</b></a><br />
<a href="#subtree"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Subtree</b></a><br />
<a href="#neighbors"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Neighbors</b></a><br />
<a href="#search-in-tree"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="45" height="20" border="0" /><b>Search &amp; Highlight in Tree</b></a><br />
<a href="#share"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="1" height="20" border="0" />"<b>Share</b>" function</a><br />
<a href="#snp-tree-viewer-illustration"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="20" border="0" /><span style="color:#d70000">Illustrated example</span> of a SNP Tree Viewer display</a><br />
<a href="#automated-searches-watch"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="20" border="0" />"<b>Watch</b>" function to receive automatic e-mail notifications about new data related to selected isolate(s)</a><br />
<a href="#automated-searches-watch-illustration"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="20" border="0" /><span style="color:#d70000">Illustrated example</span> of automatic e-mail notification for a watched isolate</a><br />
</div>
<div style="padding-left: 2em">
<h4 id="snp-tree-viewer-description"><img src="/core/assets/pathogens/images/red_box_A.png" width="20" height="20" border="0" /> Description of tree <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The top of a SNP Tree Viewer display provides summary information about the phylogenetic distance tree currently being displayed, such as:
<ul>
<li><b>Organism group</b>, such as <i>E. coli and Shigella</i>, and the corresponding <b>PDG accession.version</b> for the group.
(The "PDG" prefix = Pathogen Detection Group.)</li>
<li><b>Number of isolates in the tree</b>, and the corresponding <b>PDS accession.version</b> for the tree.
(The "PDS" prefix = Pathogen Detection SNP cluster.)</li>
</ul>
</li>
<li>An example is shown in <span style="background-color: #ffff00"><b>part A</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a></span>.</li>
<li id="snp-tree-evolves">The composition of a tree can change over time as new data are added to the Pathogen Detection Project.<br />
<i>(A separate section of this document on <a href="#data-retention">data retention and history tracking</a> provides additional information about the ways in which data and analysis results continue to evolve.)</i></li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="snp-tree-viewer-isolates-selected"><img src="/core/assets/pathogens/images/red_box_B.png" width="20" height="20" border="0" /> Isolates selected (navigation panel) <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The <b>navigation panel</b>, which has the header "<b>Isolates Selected</b>" in the SNP Tree Viewer interface, allows for easy tree navigation based on the selection of isolates. <b><i>Clicking on ANY isolate in the navigation panel will shift the focus of the tree to where that isolate is.</i></b> This is especially critical for larger trees, where the number of isolates may be several thousand, or where the number of selected isolates is large.</li>
<li>The navigation panel also provides critical information on the similarity of isolates when there is more than one isolate selected, including min, max, and avg. SNP distances and the creation date ranges of the isolate(s), providing a quick and easy-to-use summary.</li>
<li>The number of items that are listed in the "Isolates Selected" section depends upon which link you followed from the Isolates Browser output to the SNP Tree Viewer display.<br />
<ul>
<li>For example, the <a href="#snp-tree-viewer-access-illustration"><span style="color:#d70000">illustration</span> of SNP Tree Viewer launch points</a> (in the section on "<a href="#snp-tree-viewer-access">how to access the SNP Tree Viewer</a>") shows the Isolates Browser results from a search for the phrase "all-purpose flour" (as of September 4, 2018).
<ul>
<li>In the "<b>Matched Clusters</b>" section of the Isolates Browser results, clicking on the Pathogen Detection SNP cluster (<a href="#accession-prefix-pds">PDS</a>) accession would open a SNP Tree Viewer display with <b>"10 Isolates Selected"</b> out of the total 136 isolates in the tree. This is because 10 of the isolates that contain your search term have been found to belong to a SNP cluster. When you view the SNP cluster in SNP Tree Viewer, those 10 isolates will be automatically selected, and will be shown in red font in the interactive phylogenetic distance tree.</li>
<li>In the "<b>Matched Isolates</b>" section of the Isolates Browser results, clicking on an individual item (i.e., on an individual isolate's Pathogen Detection SNP cluster (PDS) or Pathogen Detection Target (PDT) accession) would open a SNP Tree Viewer display with only <b>"1 Isolate Selected"</b> out of the total 136 isolates in the tree.</li>
</ul>
</li>
</ul>
You can add or remove isolates from that list by clicking on isolates of interest in the phylogenetic tree to select/deselect them, by activating/deactivating their checkboxes in the table of all isolates in the tree, etc.
</li>
<li>An example of the "Isolates Selected" navigation panel is shown as <span style="background-color: #ffff00"><b>part B</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a></span>. It features six isolates: four clinical isolates, and two environmental isolates.</li>
<li>The selected isolates are also shown at the top of the table that lists all of the isolates in the SNP cluster, with their <b>check boxes activated</b> (as shown in <b>part C</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>).</li>
<li>The selected isolates are displayed in <span style="color:#D70000">red font</span> in the <b>phylogenetic distance tree</b> (as shown in <b>part D</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>).</li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="snp-tree-viewer-isolates-all"><img src="/core/assets/pathogens/images/red_box_C.png" width="20" height="20" border="0" /> Table of all isolates in tree <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>A table that lists all of the isolates in the SNP cluster appears above the phylogenetic distance tree. An example is shown in <span style="background-color: #ffff00"><b>part C</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a></span>.</li>
<li>The table has the same data content as the Isolates Browser, but only for the subset of isolates in the currently viewed SNP cluster. The only additional data is a checkbox column that allows selections in the table to be reflected by selections in the tree and the navigation panel. Conversely, selections in the tree are reflected by selections in the table. The table can be hidden from view and customized the same as in the Isolates Browser. <i>(A separate section of this document describes <a href="#isolates-browser-output">Isolates Browser output</a> and provides information on display controls such as <a href="#isolates-browser-display-options">choose columns</a>.)</i></li>
<li>The <b>table can be <a href="#isolates-browser-display-options">customized</a></b> in the same way as the main Isolates Browser display, for example, by using <a href="#filters">filters</a> to narrow the subset of isolates being displayed; using the <a href="#isolates-browser-display-options">choose columns</a> option to select which columns to display or hide; clicking on the column headers to change the <a href="#sort-order">sort order</a> of isolates; etc. To apply the filters to narrow the list of selected isolates, click the <span style="background-color: #ffff00"><b>Apply filters</b></span> button in the <a href="#snp-tree-viewer-isolates-selected">Navigation panel</a>.</li>
<li>The "<b>Share</b>" button at the top of the table produces a URL that captures your customized view of the tree, which can then be shared with others to reproduce the same view. Critically, this allows the user to highlight selected isolates, collapse certain parts of the tree, and generate a view that can be shared in a document or via email with collaborators. The URL is temporary; the customized display remains available for one month. <i>(<a href="#share">Read more about the "share" function</a> and <a href="#data-retention">data retention</a>.)</i></li>
</ul>
</div>
<div style="padding-left: 2em">
<h4 id="snp-tree-viewer-interactive-tree"><img src="/core/assets/pathogens/images/red_box_D.png" width="20" height="20" border="0" /> Interactive phylogenetic distance tree <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The bottom section of a SNP Tree Viewer display shows an interactive phylogenetic distance tree, as shown in <span style="background-color: #ffff00"><b>part D</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a></span>.</li>
<li id="snp-tree-viewer-red-font">Isolates that you have selected are shown in <span style="color:#D70000"><b>red font</b></span>. <b>Click on any isolate of interest</b> in a live SNP Tree Viewer display in order to open a menu that allows you to <b>select/deselect</b> it.</li>
<li id="snp-tree-viewer-controls"><b>Display Controls</b> above a phylogenetic distance tree in the SNP Tree Viewer enable you to customize the view. Mouse over a control button in a live SNP Tree Viewer display to read about its function. Some of the controls include:<br /><br />
<ul>
<li id="labels"><b>Labels</b> button (at the top of the table that lists all of the isolates in the tree) allows you to determine which labels are displayed for the isolates in the tree view, from the set of labels that are available in the SNP Tree Viewer. The selections you make will <b>persist</b> within a given browser (e.g., Chrome, Edge, Internet Explorer, Firefox, Safari) until that browser's cookies are cleared/reset.</li>
<li id="load-labels"><b>Load Labels</b> button allows you to add <b>custom labels</b> to one or more isolates in the tree view. To do this:<br />
<ul>
<li>On your local computer, <b>create a tab-delimited text file (*.txt)</b> that lists which isolates to label (by specifying their <a href="#accession-prefix-pdt">PDT*</a> accessions), and which label(s) to add to a given isolate.<br />
<ul>
<li>The text file should contain <b>one line per PDT accession and label-value pair.</b></li>
<li>The text file <b>can contain multiple lines with the same PDT accession</b>. For example, if you want to add two custom labels to a given PDT, the file should contain two lines for that accession, with one label and value pair in each line.</li>
<li>The contents of a <b>sample tab-delimited text file</b> for loading custom labels could look like:<br />
<div style="padding-left: 2em">
PDT000123456 YourLabelName1 ValueA<br />
PDT000123456 YourLabelName2 ValueB<br />
PDT000456789 YourLabelName1 ValueC<br />
PDT000456789 YourLabelName3 ValueD<br />
</div>
</li>
</ul>
</li>
<li><b>Save</b> the text file on your local computer.</li>
<li>Click on the <b>"Load Labels" button</b> and choose the file you want to load.</li>
<li>A message will appear that says, <b><i>Add N labels</i></b>, where <b><i>N</i></b> is the number of <b>properly formatted rows</b> in your text file. (Each properly formatted row contains three items in a tab-delimited format: the PDT accession, a label name, and the value. If any item is missing from a row, that row will not be counted, and the information it contains will not be displayed in the tree view.)<br />
<ul>
<li>In the case of the <b>sample text file above</b>, the message would say: <b>Add 4 labels</b>. The SNP Tree Viewer would then display ValueA and ValueB for PDT000123456, and ValueC and ValueD for PDT000456789, in addition to the other labels that were already shown for those isolates.</li>
</ul>
</li>
<li>Note: the <a href="#share">Share</a> function will not capture the custom labels you added to the display. However, you can use the "Export" option to save the customized tree in Newick, PNG, or PDF format.</li>
</ul>
</li>
<li id="expand"><b>Expand</b> button expands all branches (default)</li>
<li id="collapse"><b>Collapse</b> button collapses branches to show 100 nodes. Clusters with fewer nodes will not be collapsed.</li>
</ul>
</li>
<li id="subtree">A <b>Subtree menu</b> appears if you <b>click on the circle that represents a node in the tree</b>. The Subtree menu includes options such as:<br />
<ul>
<li id="subtree-view"><b>Subtree view</b> opens only the subtree you have selected in a new tab.</li>
<li id="subtree-collapse"><b>Collapse subtree</b> reduces the isolates in the branch into a blue cloud. Click on the collapsed node to open the menu and "Expand subtree" again, if desired.</li>
<li>As an example, see <b>part D</b> of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>. The lower left hand corner includes an inset showing the Subtree menu.</li>
</ul>
</li>
<li id="select-multiple-isolates-in-single-action">The SNP Tree Viewer offers options to <b>highlight or select groups of isolates in a single action</b>, whether you are viewing all isolates in the tree or only a subtree. For example:<br />
<ul>
<li id="neighbors">The "<b>Neighbors</b>" button (at the top of the table that lists all of the isolates in the tree) allows you to instantly select (i.e., show in red font in the tree and add them to the list of "Selected isolates") all isolates that fall within a SNP distance of your originally selected isolate(s).</li>
<li id="search-in-tree">"<b>Search &amp; Highlight in Tree</b>" searches all labels that are currently displayed by the SNP Tree Viewer, including custom labels you might have added to the tree.<!-- (Previously, the "Search in tree" function searched only the default set of labels.) -->
<ul>
<li>The browser will <b>highlight</b> (display in <b>bold font</b>) isolates that contain your search term in the tree.</li>
<li>The <b>check mark icon</b> that appears in the right hand side of the "Search &amp; Highlight in Tree" text box allows you to <b>select all of the highlighted isolates</b> with a single click. Selected isolates are displayed in <span style="color:red"><b>red font</b></span> in the tree, and are added to the list of "Selected isolates" at the top of the SNP Tree Viewer display.</li>
<li>If you prefer to <b>select individual isolates</b>, rather than the complete set of highlighted isolates, simply <b>left click on an isolate of interest</b> and choose "select" from the pop-up menu.</li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
<!-- ======== END_TREE_VIEWER_OUTPUT_USER_INTERFACE ========= -->
<!-- ======== SNP_TREE_VIEWER_SHARE_FUNCTION ============ -->
<h3 id="share">"Share" function in the SNP Tree Viewer <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>A "<b>Share</b>" button is available in the SNP Tree Viewer display (as shown in part C of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>). It produces a <b>URL that captures your customized view of the tree</b>, which can then be copied and shared with others to reproduce the same view.</li>
<li>The URL is <b>temporary</b>, remaining valid for <b>60 days</b>.</li>
<li>For the <b>first 30 days</b>, the URL will open the customized display, showing the isolates you selected and any other customizations you made to the view.</li>
<li>For the <b>second 30 days</b>, the URL continues to be valid, but during that time, it will only show a link to the default display for the most recent version of the SNP cluster. That is, the URL will not open the original customized view, but instead will redirect to a version of the phylogenetic distance tree that reflects the most recent data for the tree.<br /><br />
<i>(As noted above, under <a href="#snp-tree-viewer-description">description of tree</a>, the composition of a tree can change over time as new data are added to the Pathogen Detection Project. A separate section of this document describes the <a href="#data-retention">data retention and history tracking</a> policy and examples of the ways in which <!-- a href="#DataEvolve" -->data and analysis results continue to evolve<!-- /a -->.)</i>
</li>
</ul>
<!-- ======== END_SNP_TREE_VIEWER_SHARE_FUNCTION ========= -->
<!-- ========= TREE_VIEWER_ILLUSTRATED_EXAMPLE ============ -->
<h3 id="snp-tree-viewer-illustration">Illustrated example of SNP Tree Viewer display <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#snp-tree-viewer"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Tree Viewer, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
Each tree displays all members of a SNP cluster, defined as a group of isolates whose genome assemblies are closely related, depending on the clustering methodology used (as noted in the <a href="/pathogens/docs/data_processing">data processing</a> section of this document). The "<a href="#filters">Filters</a>" option can be used, if desired, to display a subset. The interactive phylogenetic distance tree is at the bottom of a SNP Tree Viewer display, and selected isolates are shown in <span style="color:#D70000">red font</span> in the tree.<br /><br />
<img src="/core/assets/pathogens/images/TreeViewer_PDS000003441.80.png" width="760" height="2350" border="0" alt="Illustrated example of Pathogens SNP Tree Viewer display, showing the phylogenetic distance tree for a SNP cluster that contains isolates associated with an E. coli outbreak from all-purpose flour, reflecting data as of September 4, 2018. A footnote under the illustration describes how to open a live SNP Tree Viewer display for the most current data in that SNP cluster." />
<!-- ALTERNATIVE FILENAME: img src="/core/assets/pathogens/images/TreeViewer_PDS000003441.80_PDG000000004.997.png" width="760" height="2350" border="0" -->
<ul id="snp-tree-viewer-illustration-footnotes">
<li>The illustration above shows the SNP Tree Viewer display (as of September 4, 2018) for the Pathogen Detection Group (organism group) PDG000000004.997 and the SNP cluster PDS000003441.80, which includes isolates associated with an E. coli outbreak from all-purpose flour. <i>(<a href="https://www.cdc.gov/ecoli/2016/o121-06-16/index.html">Read about that outbreak on the CDC website</a>.)</i></li>
<li>As noted above, under <a href="#snp-tree-viewer-description">description of tree</a>, the <b>composition of a tree can change over time</b> as new data are added to the Pathogen Detection Project.</li>
<li>To open a live display of the most recent data for the SNP cluster, you can <a href="/pathogens/isolates#/search/PDS000003441">search for PDS000003441 in the Isolates Browser</a>. That will retrieve all isolates that currently belong to that SNP cluster. Then click on the PDS000003441 accession number in the SNP Cluster column for any isolate in the search results to open the SNP Tree Viewer display for the current data. <i>(see <a href="#snp-tree-viewer-access-illustration">illustrated example of SNP Tree Viewer launch points</a>)</i></li>
<li><i>The <a href="#snp-tree-viewer">SNP Tree Viewer help</a> section of this document provides additional information about using the tool.<br />
A "<b>Share</b>" button on the SNP Tree Viewer display can be used to copy a URL that captures your customized view of the tree, which can then be shared with others to reproduce the same view. The URL is temporary; the customized display remains available for one month (<a href="#share">read more about the "share" function</a>).</i></li>
</ul>
<!-- ======== END_TREE_VIEWER_ILLUSTRATED_EXAMPLE ========= -->
<!-- ########## END_H2_SECTION:TREE_VIEWER ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:AUTOMATED_SEARCHES ########## -->
<h2 id="automated-searches">Automatic E-mail Notifications of New Data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#automated-searches-background">Background</a> | <a href="#automated-searches-limitations">Limitations</a><br />
<a href="#automated-searches-requirements">Requirements</a>: <a href="#my-ncbi">(1) My NCBI login</a>; <a href="#perform-search">(2) Perform search in Pathogens Isolates Browser</a>
<br /><a href="#automated-searches-save">SAVE the search in the Isolates Browser</a> (<a href="#automated-searches-save-illustration"><span style="color:#d70000">illustrated example</span></a>)<br />
<a href="#automated-searches-watch">WATCH an isolate in the SNP Tree Viewer</a> (<a href="#automated-searches-watch-illustration"><span style="color:#d70000">illustrated example</span></a>)
<br>
[<a href="#automated-searches-examples"><span style="color:#d70000">Additional examples</span> of saved searches and watched isolates</a>]
</div -->
<ul>
<li><a href="#automated-searches-background">Background</a></li>
<li><a href="#automated-searches-limitations">Limitations</a></li>
<li><a href="#automated-searches-requirements">Requirements</a>
<ul>
<li><a href="#my-ncbi">My NCBI login</a></li>
<li><a href="#perform-search">Perform search in Pathogens Isolates Browser</a></li>
<!-- li><a href="#AutomaticEmailNotificationsSaveOrWatch">SAVE the search in the Isolates Browser and/or WATCH an isolate in the SNP Tree Viewer</a></li -->
</ul>
</li>
<li><a href="#automated-searches-save"><b>SAVE</b> a search in the Pathogens Isolates Browser</a>
<ul>
<li><a href="#automated-searches-save-illustration"><span style="color:#d70000">Illustrated example</span> of automatic e-mail for a SAVED SEARCH</a></li>
</ul>
</li>
<li><a href="#automated-searches-watch"><b>WATCH</b> an isolate(s) in the SNP Tree Viewer</a>
<ul>
<li><a href="#automated-searches-watch-illustration"><span style="color:#d70000">Illustrated example</span> of automatic e-mail for a WATCHED ISOLATE</a></li>
</ul>
</li>
<!-- li><a href="#automated-searches-examples"><span style="color:#d70000">Additional examples</span> of saved searches and watched isolates</a>
<li><a href="#____________">____________</a></li>
<ul>
<li><a href="#____________">____________</a></li>
</ul>
</li -->
</ul>
<!-- ========= AUTOMATED_SEARCHES_OVERVIEW_BACKGROUND ============ -->
<h3 id="automated-searches-background">Background <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>The <a href="/pathogens/">NCBI Pathogen Detection Project</a> data are updated frequently. The project includes a feature for <b>automatic e-mail notifications of new data</b>. It is a current awareness service to inform you about new data as it becomes available, for pathogens that are of interest to you. This feature is designed to allow users to <b>search once</b>, and then <b>get automatic notifications</b> if any pathogen isolates match their search criteria.</li>
<li>Components of the automatic e-mail notifications system include:<br /><br />
<ul>
<li>A "<b>Save</b>" button in the <b>Isolates Browser</b> interface,<br />which allows you to save a search and automatically notifies you about new isolates that match the criteria of the saved search.
<i>(<a href="#automated-searches-save">Read more</a> and view an <a href="#automated-searches-save-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
<li>A "<b>Watch</b>" button in the <b>SNP Tree Viewer</b> interface,<br />which allows you to watch one or more selected isolates in a tree, and automatically notifies you about new isolates that are similar to the isolate(s) you have chosen to watch, because they fall within the SNP distance that you have specified.
<i>(<a href="#automated-searches-watch">Read more</a> and view an <a href="#automated-searches-watch-illustration"><span style="color:#d70000">illustrated example</span></a>.)</i></li>
</ul>
</li>
</ul>
<!-- ======== END_AUTOMATED_SEARCHES_OVERVIEW_BACKGROUND ========= -->
<!-- ========= AUTOMATED_SEARCHES_LIMITATIONS ============ -->
<h3 id="automated-searches-limitations">Limitations <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>Searches are triggered for each and every organism group update that is delivered to the Pathogen Browser. An email is sent for each set of hits per organism group. That means if a search, for example for a particular antimicrobial resistance gene, is not specific for a certain organism, then search results may be delivered multiple times per day. This is considered a feature and not a bug. There are currently 22 organism groups, and more are expected in the future. Not all searches can currently be done.</li>
</ul>
<!-- ======== END_AUTOMATED_SEARCHES_LIMITATIONS ========= -->
<!-- ========= AUTOMATED_SEARCHES_REQUIREMENTS_MyNCBI ============ -->
<h3 id="automated-searches-requirements">Requirements for automatic e-mail notifications <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em"><a href="#my-ncbi">My NCBI login</a> | <a href="#perform-search">Perform search in Pathogens Isolates Browser</a></div>
<ol>
<li id="my-ncbi"><b>My NCBI login</b><br />
<ul>
<li>Searches are tied to an email address. The only way to do this is to use your <a href="https://www.ncbi.nlm.nih.gov/myncbi/">My NCBI login</a>. If you do not yet have a My NCBI account, it is easy to set one up and there is no cost.</li>
<li>You will <b>need to be logged in</b> to My NCBI in order to <b>save searches</b>, which will then be run in an automated way on a daily basis. The system will send e-mail notifications when new data arrive for a saved search.</li>
<li>You <b>do not need to be logged in</b> to <b>receive the e-mail notifications</b>. The notifications will be sent to the My NCBI email address you used when creating the account.</li>
<li>More information about My NCBI is available in the <a href="https://www.ncbi.nlm.nih.gov/books/NBK3843/">My NCBI help document</a> and <a href="https://www.youtube.com/watch?v=ks46w3mNAQE">video overview (YouTube)</a>.<br />
<ul>
<li><i>The main function of MyNCBI for the Pathogens Isolates Browser is to associate your e-mail address with the searches that you save, so you can receive e-mail notifications about new data.</i></li>
<li><i>The My NCBI help document and video overview, above, provide general information about My NCBI and are included here as a general reference.</i></li>
<li><i>Some of the features described in the help document and video overview apply to NCBI databases that are within the <a href="https://www.ncbi.nlm.nih.gov/search/">Entrez search system</a>, but might not apply to Pathogens, which is outside of that system because it uses a different search engine (<a href="#solr">SOLR</a>).</i></li>
<li><i>For example, the Pathogens saved searches will not appear directly on your My NCBI account page, but are instead accessible through the "<a href="#saved-searches">Saved Searches</a>" link in the Pathogens Isolates Browser or the "<a href="#watched-isolates">Watched Isolates</a>" link in the SNP Tree Viewer.</i></li>
</ul>
</li>
</ul>
</li>
<li id="perform-search"><b>Perform search in Pathogens Isolates Browser</b><br />
<ul>
<li>In order to receive automated search results by e-mail, a search first needs to be performed in the <a href="/pathogens">Pathogens Isolates Browser</a>.</li>
<li>We recommend starting with <b>narrowly defined searches</b>, otherwise you will be inundated with meaningless and noisy search results by email, which would be better performed in the browser when needed.<br />
<i>(A separate section of this document provides <a href="#isolates-browser">Isolates Browser help</a>, which includes detailed information about search syntax, including <a href="#allowable-search-terms">allowable search terms</a>, <a href="#isolates-browser-query-tips">query tips</a>, <a href="#isolates-browser-advanced-search">advanced search</a> techniques that use the SOLR query language, a complete list of <a href="#isolates-browser-data-fields">data fields</a>, and <a href="#solr-sample-searches">examples of SOLR queries</a>.)</i></li>
<li>Then you can either <a href="#automated-searches-save">SAVE</a> your search and/or <a href="#automated-searches-watch">WATCH</a> an isolate(s) of interest, as described below, in order to receive automatic e-mail notifications of any new data that become available.</li>
</ul>
</li>
</ol>
<!-- ======== END_AUTOMATED_SEARCHES_REQUIREMENTS_MyNCBI ========= -->
<!-- ========= AUTOMATED_SEARCHES_SAVE ============ -->
<h3 id="automated-searches-save">SAVE a search in the Pathogens Isolates Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li id="save-button">After you have: (1) logged into your <a href="#my-ncbi">MyNCBI account</a>, and (2) performed a <a href="#text-terms">text search</a> in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a>, you can use the <b>"Save" button</b> to store the search strategy.</li>
<li>Your <b>search will then be run in an automated way on a daily basis</b>.</li>
<li>You will receive <b>automatic e-mail notifications only if/when</b> new isolates become available that match your search criteria.</li>
<li id="saved-searches">Use the <b>"Saved Searches" link</b> on the Pathogens Isolates Browser interface to view the list of your saved searches, and to edit or delete the searches.</li>
<li>The <a href="#automated-searches-save-illustration"><span style="color:#d70000">illustrated example</span></a> below shows the "Save" button, the "Saved Searches" link, and a sample automatic e-mail for a saved Search.</li>
</ul>
<!-- ======== END_AUTOMATED_SEARCHES_SAVE ========= -->
<!-- ========= AUTOMATED_SEARCHES_SAVE_ILLUSTRATION ============ -->
<h3 id="automated-searches-save-illustration">Illustrated example of automatic e-mail notification for a Saved Search <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<img src="/core/assets/pathogens/images/IsolatesBrowserSaveSearch_Salmonella_mindiff0to4.png" width="800" height="1650" border="0" alt="Illustrated example of the Pathogens Isolates Browser SAVE function, and including an example of an automatic e-mail message that contains a notification of new isolates that match the saved search." />
<br />
<!-- ======== END_AUTOMATED_SEARCHES_SAVE_ILLUSTRATION ========= -->
<!-- ========= AUTOMATED_SEARCHES_WATCH ============ -->
<h3 id="automated-searches-watch">WATCH an isolate in the SNP Tree Viewer <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li id="watch-button">After you have (1) logged into your <a href="#my-ncbi">MyNCBI account</a>, (2) performed a search in the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a>, and (3) launched the <b>SNP Tree Viewer</b> for any isolate retrieved by your search, you can use the <b>"Watch" button</b> to store the isolate in your <a href="#my-ncbi">My NCBI</a> account and receive automatic e-mail <b>notifications of closely related new isolates as they become available</b> in the system.<br />
<i>(A separate section of this document provides more details about <a href="#snp-tree-viewer-access">how to access the SNP Tree Viewer</a> as well as an <a href="#snp-tree-viewer-access-illustration"><span style="color:#d70000">illustrated example</span> of SNP Tree Viewer launch points</a>.)</i></li>
<li>If you select <b>multiple isolates</b> in the SNP Tree View and then press the "<b>Watch</b>" button, then <b>all of the selected isolates</b> will be added to your list of <b>watched isolates</b>.</li>
<li>The system will prompt you to enter a <b>name</b> for the watched isolate(s), and to specify the <b>maximum SNP distance</b> for receiving reports of new data.</li>
<li>Each isolate will be <b>watched on a daily basis</b> in an automated way.</li>
<li>You will receive <b>automatic e-mail notifications</b> only if/when <b>new isolates that fall within a specified SNP distance</b> of the isolate(s) that you select in that tree view become available.</li>
<li id="watched-isolates">Use the <b>"Watched Isolates" link</b> on the SNP Tree Viewer interface to view your list of watched isolates, and to rename a watch, edit the SNP cutoff, or delete it from your list.</li>
<li>The <a href="#automated-searches-watch-illustration"><span style="color:#d70000">illustrated example</span></a> below shows the "Watch" button, the "Watched Isolates" link, and a sample automatic e-mail for a watched isolate.</li>
</ul>
<!-- ======== END_AUTOMATED_SEARCHES_WATCH ========= -->
<!-- ========= AUTOMATED_SEARCHES_WATCH_ILLUSTRATION ============ -->
<h3 id="automated-searches-watch-illustration">Illustrated example of automatic e-mail notification for a Watched Isolate <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<img src="/core/assets/pathogens/images/TreeViewerWatch_Campylobacter_PDT000428978_30SNP_distance.png" width="800" height="2200" border="0" alt="Illustrated example of the Pathogens SNP Tree Viewer WATCH function, and including an example of an automatic e-mail message that contains a notification of new isolates that fall within the SNP distance you specified from an isolate that you are watching." />
<br /><br />
<!-- ======== END_AUTOMATED_SEARCHES_WATCH_ILLUSTRATION ========= -->
<!-- ========= AUTOMATED_SEARCHES_EXAMPLES ============ -->
<!-- H3 id="automated-searches-examples">Additional examples of saved searches and watched isolates <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#automated-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Isolates Browser Automated Searches, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>_________ <a href="/pathogens/isolates#/search/">Isolates Browser</a> _____________ <b>________</b> _____________ <a href="#_____________">_____________</a>.</li>
<li>________________________________________________.</li>
<li>________________________________________________.</li>
</ul -->
<!-- ======== END_AUTOMATED_SEARCHES_EXAMPLES ========= -->
<!-- ======= END_ISOLATES_BROWSER_AUTOMATED_SEARCHES ========== -->
<!-- ########## END_H2_SECTION:AUTOMATED_SEARCHES ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:ANTIMICROBIAL_RESISTANCE_AMR_RESOURCES ########## -->
<h2 id="amr">Antimicrobial Resistance (AMR) Resources <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#amr-overview">Overview</a> | <a href="#amr-resources-schematic"><span style="color:#d70000">schematic illustration</span> of AMR resources</a><br />
<a href="#amr-landing-page">AMR Landing page</a> | <a href="#amr-resources-page">AMR Resources page</a><br />
<a href="#reference-gene-catalog">Pathogen Detection Reference Gene Catalog</a> | <a href="#refgene-sample-searches"><span style="color:#d70000">use cases/sample searches</span></a><br />
<a href="#amr-finder">AMRFinderPlus</a> | <a href="#amr-finder-install">install software</a>; <a href="#amr-finder-data-files">download data files</a>: <a href="#amr-finder-reference-gene-catalog">Reference Gene Catalog data</a>, <a href="#amr-finder-hmms">Hidden Markov Models (HMMs)</a>, <a href="#amr-finder-hierarchy">AMRFinder Hierarchy</a> (<a href="#amr-finder-hierarchy-illustration"><span style="color:#d70000">illustrated example</span> of a hierarchy</a>); <a href="#amr-finder-results">interpret AMRFinderPlus results</a>; <a href="#amr-finder-read-more">read more</a>, <a href="#amr-finder-publication">publication/citation</a><br />
<a href="#amr-submit">Submit sequence and phenotype data related to AMR</a><br />
<a href="#amr-ftp">FTP/Raw Data Download</a>
</div -->
<ul>
<li><a href="#amr-overview">Overview</a> (<a href="#amr-resources-schematic"><span style="color:#d70000">schematic illustration</span> of AMR resources</a>)</li>
<li><a href="#amr-landing-page">AMR Landing page</a></li>
<li><a href="#amr-resources-page">AMR Resources page</a></li>
<li><a href="#amr-finder"><b>AMRFinderPlus</b></a>
<ul>
<li><a href="#amr-finder">What is AMRFinderPlus?</a></li>
<li><a href="#amr-finder-install">Install software</a></li>
<li><a href="#amr-finder-data-files">Download data files</a>: <a href="#amr-finder-reference-gene-catalog">Reference Gene Catalog data</a>, <a href="#amr-finder-hmms">Hidden Markov Models (HMMs)</a>, <a href="#amr-finder-hierarchy">AMRFinder Hierarchy</a> (<a href="#amr-finder-hierarchy-illustration"><span style="color:#d70000">illustrated example</span> of a hierarchy</a>)</li>
<li><a href="#amr-finder-results">Interpret AMRFinderPlus results</a></li>
<li><a href="#amr-finder-read-more">Read more</a></li>
<li><a href="#amr-finder-publication">Publication/Citation</a></li>
</ul>
</li>
<li><a href="#microbigge"><b>MicroBIGG-E</b> (<b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements)</a>
<ul>
<li><a href="#microbigge-what-is">What is MicroBIGG-E?</a></li>
<li><a href="#microbigge-access">Where to access MicroBIGG-E?</a></li>
<li><a href="#microbigge-search-tips">Search tips</a></li>
<li><a href="#microbigge-data-fields">Data fields</a></li>
<li><a href="#microbigge-output">Output</a></li>
<li><a href="#microbigge-sample-searches"><span style="color:#d70000">Use cases/sample searches</span> of MicroBIGG-E</a></li>
<li><a href="/pathogens/docs/microbigge_gcp/">Full MicroBIGG-E results in Google Cloud</a></li>
<li><a href="/pathogens/docs/microbigge_map/">MicroBIGG-E Map</a>
<ul>
<li><a href="/pathogens/docs/microbigge_map/#what-is-the-microbigge-map">What is the MicroBIGG-E Map</a></li>
<li><a href="/pathogens/docs/microbigge_map/#using-the-microbigge-map">Using the MicroBIGG-E Map</a></li>
<li><a href="/pathogens/docs/microbigge_map/#microbigge-map-displays">MicroBIGG-E Map Displays</a></li>
<li><a href="/pathogens/docs/microbigge_map/#downloading-figures">Downloading Figures</a></li>
</ul>
</li>
</ul>
</li>
<li><a href="#reference-gene-catalog"><b>Pathogen Detection Reference Gene Catalog</b></a>
<ul>
<li><a href="#refgene-what-is">What is the Pathogen Detection Reference Gene Catalog?</a></li>
<li><a href="#refgene-access">Where to access the Pathogen Detection Reference Gene Catalog</a></li>
<li><a href="#refgene-search-tips">Search tips</a></li>
<li><a href="#refgene-data-fields">Data Fields</a></li>
<li><a href="#refgene-output">Output</a></li>
<li><a href="#refgene-sample-searches"><span style="color:#d70000">Use cases/sample searches</span> of the Reference Gene Catalog</a></li>
</ul>
</li>
<li><a href="/pathogens/docs/gene_hierarchy/"><b>Pathogen Detection Reference Gene Hierarchy</b></a>
<ul>
<li><a href="/pathogens/docs/gene_hierarchy/#what-is-the-reference-gene-hiera">What is the Reference Gene Hierarchy?</a></li>
<li><a href="/pathogens/docs/gene_hierarchy/#where-to-access-the-reference-ge">Where to access the Reference Gene Hierarchy</a></li>
<li><a href="/pathogens/docs/gene_hierarchy/#how-to-search-the-reference-gene">How to search the Reference Gene Hierarchy</a></li>
<li><a href="/pathogens/docs/gene_hierarchy/#data-fields-in-the-reference-gen">Data fields in the Reference Gene Hierarchy</a></li>
<li><a href="/pathogens/docs/gene_hierarchy/#output">Output</a></li>
</ul>
</li>
<li><a href="/pathogens/docs/ast/"><b>Pathogen Detection Antibiotic Susceptibility Test (AST) Browser</b></a>
<ul>
<li><a href="/pathogens/docs/ast/#what-is-the-ast-browser">What is the AST Browser</a></li>
<li><a href="/pathogens/docs/ast/#where-to-access-the-pathogen-det">Where to access the Pathogen Detection AST Browser </a></li>
<li><a href="/pathogens/docs/ast/#using-the-ast-browser">How to use the AST Browser</a></li>
<li><a href="/pathogens/docs/ast/#data-fields-in-the-ast-browser">Data fields in the AST Browser</a></li>
<li><a href="/pathogens/docs/ast/#output">Output</a></li>
</ul>
</li>
<li><a href="/pathogens/docs/HMM_catalog/"><b>Pathogen Detection Reference HMM Catalog</b></a>
<ul>
<li><a href="/pathogens/docs/HMM_catalog/#what-is-the-reference-hmm-catalo">What is the Pathogen Detection Reference HMM Catalog</a></li>
<li><a href="/pathogens/docs/HMM_catalog/#where-to-access-the-pathogen-det">Where to access the Pathogen Detection Reference HMM Catalog</a></li>
<li><a href="/pathogens/docs/HMM_catalog/#search-tips-for-the-pathogen-det">Search tips</a></li>
<li><a href="/pathogens/docs/HMM_catalog/#data-fields-in-the-pathogen-dete">Data fields</a></li>
<li><a href="/pathogens/docs/HMM_catalog/#output">Output</a></li>
</ul>
</li>
<li><a href="#amr-submit">Submit sequence and phenotype data related to AMR</a></li>
<li><a href="#amr-ftp">FTP/Raw Data Download</a></li>
</ul>
<!-- =========== AMR_OVERVIEW ============ -->
<h3 id="amr-overview">AMR Overview <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
In response to the rising threat of antimicrobial resistance (AMR) in pathogens, the White House developed the <a href="https://obamawhitehouse.archives.gov/blog/2015/03/27/our-plan-combat-and-prevent-antibiotic-resistant-bacteria">National Action Plan</a> for Combating Antibiotic-Resistant Bacteria in 2015 and updated that plan with the <a href="https://aspe.hhs.gov/reports/national-action-plan-combating-antibiotic-resistant-bacteria-2020-2025">2020-2025 National Action Plan for Combating Antibiotic-Resistant Bacteria</a>. NCBI has built several resources and tools to achieve several specific project goals, including comparison of newly isolated pathogens to existing pathogen data to identify relationships, and to analyze the AMR repertoire of each isolate. The NCBI Pathogen Detection project has developed several resources and web interfaces as part of this effort including <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>, the <a href="/pathogens/isolates/">Isolates Browser</a>, <a href="/pathogens/microbigge/">MicroBIGG-E</a>, the <a href="/pathogens/ast/">AST Browser</a>, the <a href="/pathogens/refgene/">Reference Gene Catalog</a>, the <a href="/pathogens/genehierarchy/">Reference Gene Hierarchy</a>, the <a href="/pathogens/hmm/">Reference HMM Catalog</a>, also making data available on <a href="/docs/gcp/">Google Cloud</a> and on our <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">FTP site</a>. The <a href="#amr-resources-schematic"><span style="color:#d70000">schematic illustration</span></a> below shows some of the antimicrobial resistance resources in the NCBI Pathogen Detection project, including data sets and tools, as well as the relationships among them.<br /><br />
<span id="amr-resources-schematic">
<img src="/core/assets/pathogens/images/AMR_resources_schematic.png" width="800" height="1050" border="0" alt="Schematic illustration showing the antimicrobial resistance (AMR) resources in the NCBI Pathogen Detection project." /></span><br />
<div style="padding-left: 2em">
Additional details about each resource are available:
<ul>
<li><b>Pathogen Detection Reference Gene Catalog</b>: <a href="#reference-gene-catalog">read more</a>, <a href="/pathogens/isolates#/refgene/">browse/search</a>, <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/Data/">download data</a>, <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/changes.txt">Change log</a></li>
<li><b>NCBI AMR Hidden Markov Models (HMMs)</b>: <a href="/pathogens/docs/HMM_catalog">read more</a>, <a href="/pathogens/hmm">browse/search</a>, <a href="https://ftp.ncbi.nlm.nih.gov/hmm/NCBIfam-AMRFinder/">download data</a></li>
<li><b>AMRFinder Hierarchy</b>: <a href="#amr-finder-hierarchy">read more</a>, <a href="/pathogens/docs/gene_hierarchy">read more</a>, <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/ReferenceGeneCatalog.txt">view/download file</a></li>
<li><b>AMRFinderPlus</b>: <a href="#amr-finder">read more</a>, <a href="https://github.com/ncbi/amr/wiki">install</a></li>
<li><b>Isolates Browser</b>: <a href="#isolates-browser">read more about the Isolates Browser</a>, about <a href="#data-type-genotype">genotypes</a> <i>(which are displayed in the <a href="#isolates-browser-data-field-AMRGenotypes">AMR_genotypes</a>, <a href="#isolates-browser-data-field-stress-genotypes">stress_genotypes</a>, and <a href="#isolates-browser-data-field-virulence-genotypes">virulence_genotypes</a> data fields)</i>; and about <a href="#data-type-phenotype">phenotypes</a> <i>(which are displayed in the <a href="#isolates-browser-data-field-ASTPhenotypes">AST_phenotypes</a> data field and are based upon Antimicrobial Susceptibility Test (AST) results)</i></li>
<li><b>MicroBIGG-E</b> (<b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements): <a href="#microbigge">read more</a>, <a href="/pathogens/microbigge/">browse/search</a>
<!-- ul>
<li><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinder/data/">download data from AMRFinder analyses of isolate genomes</a></li>
<li><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/data/">download data from AMRFinderPlus analyses of isolate genomes</a></li>
</ul -->
</li>
</ul>
</div>
</div>
<!-- =========== END_AMR_OVERVIEW ============ -->
<!-- =========== AMR_HOME_PAGE ============ -->
<h3 id="amr-landing-page">AMR Landing page <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <a href="/pathogens/antimicrobial-resistance/">AMR landing page</a> provides information about the NCBI National Database of Antibiotic Resistant Organisms (<b>NDARO</b>), a collaborative, cross-agency, centralized hub for researchers to access AMR data to facilitate real-time surveillance of pathogenic organisms. (<i>Read more in the <a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/Factsheet_AMR_Project.pdf">antimicrobial resistance factsheet</a>.</i>)
</div>
<!-- =========== END_AMR_HOME_PAGE ============ -->
<!-- =========== AMR_RESOURCES_PAGE ============ -->
<h3 id="amr-resources-page">AMR Resources page <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The <a href="/pathogens/antimicrobial-resistance/resources/">AMR Resources page</a> provides a list of available resources, with a brief description and sample searches or links to additional information about each one.
</div>
<!-- =========== END_AMR_RESOURCES_PAGE ============ -->
<!-- =========== REFERENCE_GENE_CATALOG ============ -->
<h3 id="reference-gene-catalog">Pathogen Detection Reference Gene Catalog help <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<!-- =========== REFGENE_TOC ============ -->
<div style="padding-left: 2em">
<ul>
<li><a href="#refgene-what-is">What is the Pathogen Detection Reference Gene Catalog?</a>
<ul>
<li><a href="#refgene-scope">Scope: the Reference Gene Catalog includes two data subsets:</a>
<ul>
<li><a href="#refgene-scope-core">Core</a></li>
<li><a href="#refgene-scope-plus">Plus</a></li>
</ul>
</li>
<li><a href="#refgene-non-redundant">Non-redundant</a></li>
<li><a href="#refgene-and-isolates-browser-relationship">Relationship between Isolates Browser and Pathogen Detection Reference Gene Catalog</a></li>
<li><a href="#refgene-and-hierarchy-and-hmm">Relationship between the Pathogen Detection Reference Gene Catalog, Reference Gene Hierarchy, and Reference HMM Catalog</a></li>
</ul>
</li>
<li><a href="#refgene-access">Where to access the Pathogen Detection Reference Gene Catalog</a>
<ul>
<li><a href="#refgene-access-browse">Browse/Search the Pathogen Detection Reference Gene Catalog</a></li>
<li><a href="#refgene-access-download">Download the Pathogen Detection Reference Gene Catalog data</a></li>
</ul>
</li>
<li><a href="#refgene-search-tips">Search tips</a>
<ul>
<li><a href="#refgene-allowable-search-terms">Allowable search terms</a></li>
<li><a href="#refgene-basic-search">Basic search</a></li>
<li><a href="#refgene-advanced-search">Advanced search</a></li>
<li><a href="#refgene-filters">Filters</a></li>
</ul>
</li>
<li><a href="#refgene-data-fields">Data Fields</a>
<ul>
<li><a href="#refgene-data-field-allele">allele</a></li>
<li><a href="#refgene-data-field-gene-family">gene_family</a></li>
<li><a href="#refgene-data-field-product-name">product_name</a></li>
<li><a href="#refgene-data-field-scope">scope</a></li>
<li><a href="#refgene-data-field-type">type</a></li>
<li><a href="#refgene-data-field-subtype">subtype</a></li>
<li><a href="#refgene-data-field-class">class</a></li>
<li><a href="#refgene-data-field-subclass">subclass</a></li>
<li><a href="#refgene-data-field-refseq-protein-accession">refseq_protein_accession</a></li>
<li><a href="#refgene-data-field-refseq-nucleotide-accession">refseq_nucleotide_accession</a></li>
<li><a href="#refgene-data-field-genbank-protein-accession">genbank_protein_accession</a></li>
<li><a href="#refgene-data-field-genbank-nucleotide-accession">genbank_nucleotide_accession</a></li>
<li><a href="#refgene-data-field-organism">organism fields:</a>
<ul>
<li><a href="#refgene-data-field-whitelisted-taxa">whitelisted_taxa</a></li>
<li><a href="#refgene-data-field-blacklisted-taxa">blacklisted_taxa</a></li>
</ul>
</li>
<li><a href="#refgene-data-field-curated-refseq-start">curated_refseq_start</a></li>
<li><a href="#refgene-data-field-genbank-start">genbank_start</a></li>
<li><a href="#refgene-data-field-genbank-stop">genbank_stop</a></li>
<li><a href="#refgene-data-field-genbank-strand">genbank_strand</a></li>
<li><a href="#refgene-data-field-refseq-start">refseq_start</a></li>
<li><a href="#refgene-data-field-refseq-stop">refseq_stop</a></li>
<li><a href="#refgene-data-field-refseq-strand">refseq_strand</a></li>
<li><a href="#refgene-data-field-pubmed-reference">pubmed_reference</a></li>
<li><a href="#refgene-data-field-synonyms">synonyms</a></li>
<li><a href="#refgene-data-field-links">links</a></li>
<!-- li><a href="#_______">______________</a></li -->
</ul>
</li>
<li><a href="#refgene-output">Output</a>
<ul>
<li><a href="#refgene-output-table">Tabular list of genes</a></li>
<li><a href="#refgene-filters">Filters to refine results</a></li>
<!-- li><a href="#refgene-sort-order">Sort order</a></li -->
<li><a href="#refgene-display-options">Customize the Reference Gene Catalog display</a>
</li>
<li><a href="#reference-data-retention">Data archive and retention policy</a></li>
</ul>
</li>
<li><a href="#refgene-sample-searches"><span style="color:#d70000">Use cases/sample searches</span> of the Reference Gene Catalog</a>
<ul>
<li><a href="#refgene-sample-search-multidrug-resistant">Find multidrug resistant genes</a></li>
<li><a href="#refgene-sample-search-amr-gene-carbapenem">Find carbapenem resistant genes</a></li>
<li><a href="#refgene-sample-search-amr-point-mutations-quinolones">Find point mutations in <i>Escherichia</i> that confer resistance to quinolones</a></li>
</ul>
</li>
<!-- li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a>
<ul>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
</ul>
</li>
<li><a href="#_______">______________</a>
<ul>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a>
<ul>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
<li><a href="#_______">______________</a></li>
</ul>
</li>
</ul>
</li -->
</ul>
</div>
<!-- =========== END_REFGENE_TOC ============ -->
<!-- ========= REFGENE_WHAT_IS ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-what-is">What is the Pathogen Detection Reference Gene Catalog? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> is a <a href="#refgene-non-redundant">non-redundant</a> database of bacterial genes related to antimicrobial resistance, biocide and stress resistance, general efflux, virulence, or antigenicity. A graphical user interface (GUI) allows you to browse and search the database.<br /><br />
<b>Every row</b> in the Pathogen Detection Reference Gene Catalog display is a <b>reference gene</b> or a <b>point mutation</b>.<br /><br />
<!-- ======= REFERENCE_GENE_CATALOG_SCOPE ======= -->
<span id="refgene-scope"><b>Scope: the Reference Gene Catalog includes two data subsets:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ol>
<li id="refgene-scope-core">"<b>Core</b>": this subset includes highly curated, AMR-specific genes and proteins from the Bacterial Antimicrobial Resistance Reference Gene Database (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>), plus point mutations. The sources of input for this <b>curated database</b> include: 1) allele assignments, 2) exchanges with other external curated resources, 3) reports of novel antimicrobial resistance proteins in the literature.</li>
<li id="refgene-scope-plus">"<b>Plus</b>": this subset includes genes related to biocide and stress resistance, general efflux, virulence or antigenicity, or other AMR genes whose presence/absence are unlikely to affect phenotype and/or whose phenotype is highly uncertain.<br /><br />
<i>Proteins in the reference gene catalog may be recategorized from core to plus or vice-versa based on curation and the literature. Changes are enumerated in the 'changes.txt' file for each AMRFinderPlus database release.</i>
</li>
</ol>
<!-- ======= END_REFERENCE_GENE_CATALOG_SCOPE ======= -->
<!-- ======= REFERENCE_GENE_CATALOG_NON_REDUNDANT ======= -->
<span id="refgene-non-redundant"><b>Non-redundant</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li id="refgene-non-redundant-definition">The definition of redundant (or 'non-unique') will differ, depending on the type of data element (allele, gene, or point mutation). For example:</li>
<li id="refgene-non-redundant-allele">An <b>ALLELE</b> should only ever show up once in the table. An allele is a unique protein sequence that corresponds to a unique gene symbol, and so, by definition, should occur only once.<!-- PD-2613, Slava, 20190919: In the AMR database all alleles have unique sequences and unique names. --></li>
<li id="refgene-non-redundant-point-mutation">An allele name for a <b>POINT MUTATION</b> can occur in <b>multiple rows</b> of the Reference Gene Catalog, if the point mutation is found in <b>different organisms</b><!-- (technically, different <b>taxonomic groups<b>, as some organisms, such as E. coli and Shigella, are placed into a single taxonomic group) -->, and if the <b>proteins</b> in those organisms are <b>not identical</b>.
<!-- An <b>ALLELE NAME</b> might appear in multiple rows of the Reference Gene Catalog display, if that allele has been found in multiple nucleotide or protein sequences. --><!-- The text below was ok'ed by Mike and is from https://jira.ncbi.nlm.nih.gov/browse/PD-2864: -->
<ul>
<li id="refgene-non-redundant-different-proteins">
For example, the allele name <a href="/pathogens/isolates#/refgene/gyrA_D82G">gyrA_D82G</a> occurs in both <i>E. coli</i> and <i>Salmonella</i>. Each of those organisms has its own reference sequence protein (<a href="#accession-prefix-wp">WP_* accession</a>), because the protein sequences are not identical. The <i>E. coli</i> gyrA protein sequence is <a href="https://www.ncbi.nlm.nih.gov/protein/WP_001281243.1">WP_001281243.1</a>, and the <i>Salmonella</i> gyrA protein is <a href="https://www.ncbi.nlm.nih.gov/protein/WP_001281271.1">WP_001281271.1</a>.<br />
<!-- i>(Note: To view the identifier of the sequence in which an allele or gene appears, mouse over the refseq_protein_accession or the refseq_nucleotide_accession, as available, and/or click on the accession to view the sequence record.)</i --></li>
<li id="refgene-non-redundant-identical-proteins">If, on the other hand, <b>two or more organisms</b> have an <b>identical protein</b> sequence for a given gene, and the <b>same allele</b> has been found in all of those organisms, there will be a <b>single row</b> in the Reference Gene Catalog, showing the allele name and the Reference Sequence <a href="#accession-prefix-wp">WP_* accession</a>. </li>
</ul>
</li>
<li id="refgene-non-redundant-gene">A given <b>GENE SYMBOL</b> can have multiple rows in the table, as multiple proteins can be assigned the same gene symbol, but each <a href="#accession-prefix-wp">WP_* accession</a> will be unique.<br /><br />
<i>Details about <b>WP_* accessions</b></i> <i>are provided on the web pages that describe the <a href="https://www.ncbi.nlm.nih.gov/refseq/about/nonredundantproteins/">RefSeq non-redundant proteins</a>, the <a href="https://www.ncbi.nlm.nih.gov/refseq/about/prokaryotes/reannotation/">Prokaryotic RefSeq Genome Re-annotation Project</a>, and the <a href="https://ftp.ncbi.nlm.nih.gov/refseq/release/announcements/WP-proteins-06.10.2013.pdf">New RefSeq protein product and data model</a>.</i></li>
</ul>
<!-- ======= END_REFERENCE_GENE_CATALOG_NON_REDUNDANT ======= -->
<!-- ==== RELATIONSHIP_BETWEEN_REFERENCE_GENE_CATALOG_AND_ISOLATES_BROWSER ==== -->
<span id="refgene-and-isolates-browser-relationship"><b>Relationship between the Pathogen Detection Reference Gene Catalog and Pathogens Isolates Browser</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> are <b>related</b> resources and are <b>integrated</b> with each other.</li>
<li>The main <b>similarities</b> between the resources are their <b>shared search engine</b> and <b>similar search techniques</b>:
<ul>
<li>Both use the <a href="#solr">SOLR query language</a> and allow searches by a wide variety of text terms.</li>
<li>The search tips provided in the <a href="#isolates-browser">Isolates Browser help documentation</a> therefore also apply to the Reference Gene Catalog, such as <a href="#isolates-browser-basic-search">basic search</a> techniques, <a href="#isolates-browser-advanced-search">advanced search</a> techniques, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive versus case insensitive searches</a>, and the availability of "filters" to refine search results.</li>
</ul>
</li>
<li>The main <b>differences</b> between the resources are the <b>scope</b> of data being searched, the set of <b>data fields</b> (and <b>filters</b>, which are based on data fields) that are available for searching, and the <b>columns</b> that are shown in the display of search results: <!-- i>(The <a href="#refgene-data-fields">Reference Gene Catalog data fields</a> are described below, and the <a href="#isolates-browser-data-fields">Pathogens Isolates Browser data fields</a> are described in the <a href="#isolates-browser">Isolates Browser help</a>.)</i -->
<ul>
<li>The <a href="/pathogens/isolates#/search/"><b>Pathogens Isolates Browser</b></a> searches all <b>isolate genomes</b> in the Pathogen Detection project, as well as corresponding <b>metadata</b> that are described under <a href="#data-types">types of data</a>.
<ul>
<li><b>Every row</b> in the Isolates Browser is an <b>assembled isolate</b>, possibly with antimicrobial resistance (AMR), virulence, and/or stress response <a href="#data-type-genotype">genotype data</a>, and antibiotic susceptibility (AST) <a href="#data-type-phenotype">phenotype data</a>, as available.</li>
<li>The <a href="#isolates-browser">Isolates Browser help documentation</a> describes the <a href="#isolates-browser-data-fields">available data fields</a> and <a href="#isolates-browser-output">output</a>.</li>
</ul>
</li>
<li>The <a href="/pathogens/isolates#/refgene/"><b>Pathogen Detection Reference Gene Catalog</b></a> is a <a href="#refgene-non-redundant">non-redundant</a> database of <b>bacterial genes</b> related to antimicrobial resistance, biocide and stress resistance, general efflux, virulence, or antigenicity.
<ul>
<li><b>Every row</b> in the Pathogen Detection Reference Gene Catalog display is a <b>reference gene</b> or a <b>point mutation</b>.</li>
<li>The <a href="#reference-gene-catalog">Reference Gene Catalog help</a> describes the <a href="#refgene-scope">scope of data</a>, <a href="#refgene-data-fields">available data fields</a>, and <a href="#refgene-output">output</a>.</li>
<!-- li>The <a href="#refgene-data-fields">Pathogen Detection Reference Gene Catalog data fields</a> and <a href="#refgene-output">output</a> are described in the <a href="#reference-gene-catalog">Reference Gene Catalog help</a>.</li -->
</ul>
</li>
</ul>
</li>
<li>They are <b>integrated</b> with each other through links in the data displays. For example:
<ul>
<!-- li>The <a href="#isolates-browser-data-field-AMRGenotypes">AMR genotypes</a>, <a href="#isolates-browser-data-field-stress-genotypes">Stress genotypes</a>, and <a href="#isolates-browser-data-field-virulence-genotypes">Virulence genotypes</a> columns in the Isolates Browser link to the corresponding gene/allele record(s) in the Pathogen Detection Reference Gene Catalog.</li -->
<li>The <a href="#refgene-data-field-gene-family">gene family</a> column in the Pathogen Detection Reference Gene Catalog links to the Isolates Browser. Clicking on a gene symbol in that column will open the Isolates Browser and will display the isolates that have been found, by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to contain the gene of interest.</li>
</ul>
</li>
</ul>
<!-- ==== END_RELATIONSHIP_BETWEEN_REFERENCE_GENE_CATALOG_AND_ISOLATES_BROWSER ==== -->
<!-- ==== RELATIONSHIP_BETWEEN_REFERENCE_GENE_CATALOG_AND_HIERARCHY_AND_HMM ==== -->
<span id="refgene-and-hierarchy-and-hmm"><b>Relationship between the Pathogen Detection Reference Gene Catalog, Reference Gene Hierarchy, and Reference HMM Catalog</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>, <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and <a href="/pathogens/hmm">Reference HMM Catalog</a> are interrelated and integrated databases that are all used in concert to identify gene sequences by <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus</a>. <br />
Curation of Reference genes and HMMs is organized in the framework of the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, so looking at this resource will show how Pathogen Detection curators relate genes to one another. Note that genes are placed in the Reference Gene Hierarchy, but point mutations are not.
<ul>
<li>As with the Isolates Browser, all use a shared search engine and similar search techniques:
<ul>
<li>All use the <a href="#solr">SOLR query language</a> and allow searches by a wide variety of text terms.</li>
<li>The search tips provided in the <a href="#isolates-browser">Isolates Browser help documentation</a> therefore also apply to the reference browsers, such as <a href="#isolates-browser-basic-search">basic search</a> techniques, <a href="#isolates-browser-advanced-search">advanced search</a> techniques, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive versus case insensitive searches</a>, and the availability of "filters" to refine search results.</li>
</ul>
</li>
<li>To link out to the Reference Gene Hierarchy from the Reference Gene Catalog, use the <b>Choose columns</b> button to add the <b>Hierarchy node ID</b> column to the table, then click on the Hierarchy node ID you wish to see in the Reference Gene Hierarchy.</li>
</ul>
</li>
</ul>
<!-- ==== END_RELATIONSHIP_BETWEEN_REFERENCE_GENE_CATALOG_AND_HIERARCHY_AND_HMM ==== -->
</div>
</div>
<!-- ====== END_REFGENE_WHAT_IS ========= -->
<!-- ========= REFGENE_ACCESS ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-access">Where to access the Pathogen Detection Reference Gene Catalog <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<a href="/pathogens/isolates#/refgene/">The Pathogen Detection Reference Gene Catalog</a> is accessible from the
<a href="/pathogens">Pathogen Detection Project home page</a> (as a link in the right-hand margin under "Data Resources"), from the
<a href="/pathogens/antimicrobial-resistance/">AMR landing page</a> (National Database of Antibiotic Resistant Organisms (NDARO)), and from the <a href="/pathogens/antimicrobial-resistance/resources/">AMR Resources page</a>.<br /><br />
<span id="refgene-access-browse"><b>Browse/Search</b> the Reference Gene Catalog:</span><br />
<a href="/pathogens/isolates#/refgene/">https://www.ncbi.nlm.nih.gov/pathogens/refgene</a>.<br /><br />
<span id="refgene-access-download"><b>Download</b> Reference Gene Catalog data:</span><br />
<p>Data from the Reference Gene Catalog can be downloaded in multiple formats. From the web interface you can get sequence and table data you see by clicking on the <b>Download</b> button at the top of the table (See the <a href="#refgene-output-table">Output section</a> for more info).</p>
<p>To get the data in <b>table</b> format click <b>Download</b> then select the <b>File type: Table</b>, select either tab-delimited (.tsv) or comma-delimited (.csv) and select a filename to download. Only the rows and columns that are visible in the table view on the web interface will be included in the downloaded file.</p>
<p>To get <b>sequence</b> data from the web interface click the <b>Download</b> button then select the <b>File type: Dataset</b>. Choose <b>Reference nucleotide</b>, <b>Reference nucleotide with flanks</b>, and/or the <b>Reference protein</b> sequence to download in FASTA format. Note that reference sequences for point mutations will be the "wildtype" references not including the mutations, and that RNA genes or promoter region references will not have protein sequences. Flanking nucleotide sequences may be limited to 100-bp or less depending on the source sequences in GenBank or RefSeq. The .zip file downloaded will be in the "Datasets" format including the metadata for sequences included in JSON format. See the <a href="/datasets/docs/v1/reference-docs/data-reports/">NCBI Datasets documentation</a> for more information on metadata file formats.</p>
<p>A tab-delimited table of the metadata in the Reference Gene Catalog is available in the AMRFinderPlus database release. See the <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">AMRFinderPlus database</a> documentation for the location and the <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database#referencegenecatalogtxt">ReferenceGeneCatalog.txt file format documentation</a> for more information.</p>
<br /><br />
</div>
</div>
<!-- ====== END_REFGENE_ACCESS ========= -->
<!-- ========= REFGENE_SEARCH_TIPS ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-search-tips">Search tips for the Pathogen Detection Reference Gene Catalog <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<span id="refgene-allowable-search-terms"><b>Allowable search terms</b> (Pathogen Detection Reference Gene Catalog)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> can be searched by the terms that appear in any of the <a href="#refgene-data-fields"><b>data fields</b></a> described below. A search example is provided after each data field description, when possible.</li>
</ul>
<span id="refgene-basic-search"><b>Basic search</b> (Pathogen Detection Reference Gene Catalog)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#isolates-browser-basic-search">basic search</a> section also apply to the Reference Gene Catalog, such as searches for <a href="#query-tips-multiple-terms">multiple terms</a>, <a href="#query-tips-special-characters">special characters</a>, <a href="#query-tips-phrase-search-quotes">phrase searches</a>, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a>, etc.</li>
</ul>
<span id="refgene-advanced-search"><b>Advanced search</b> (Pathogen Detection Reference Gene Catalog)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#isolates-browser-advanced-search">advanced search</a> section also apply to the Reference Gene Catalog, because both resources use the <a href="#solr">SOLR query language</a>.</li>
<li>The main difference is the data fields that are available to be searched, because each resource has its own set of data fields. <i>(See a list of the <a href="#refgene-data-fields-list">data fields in the Pathogen Detection Reference Gene Catalog</a> (below) or the <a href="#isolates-browser-data-fields-list">data fields in the Isolates Browser</a>.)</i></li>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> also apply to the Reference Gene Catalog, such as searches for <a href="#query-tips-multiple-terms">multiple terms</a>, <a href="#query-tips-special-characters">special characters</a>, <a href="#query-tips-phrase-search-quotes">phrase searches</a>, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a>, etc.</li>
</ul>
<span id="refgene-filters"><b>Filters</b> (Pathogen Detection Reference Gene Catalog)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The "Filters" menu options in the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a basic search or an advanced search.</li>
<li>By default, each filter displays the <b>top 100 terms</b> (based on the number of items retrieved by a term) listed by count of value within that set of top 100. Note that:
<ul>
<li>A <b>Boolean "OR"</b> is applied if multiple items are checked in the same filter field. This way you can choose multiple values in the same filter. For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>, then check the boxes for "Stress" and for "Virulence" in the "Type" filter. The system will retrieve genes that are associated with either stress resistance or with virulence.</li>
</ul>
</li>
<li>A <b>Boolean "AND"</b> is applied if you select items in several different filter fields (Type, Class, etc). For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>, then check the boxes for "Point" in the "Subtype" filter and "Quinolone" in the "Class" filter. The system will retrieve alleles that meet both of your specified criteria (in this case, point mutations that confer resistance to quinolones).</li>
</ul>
</li>
<!-- li>If you prefer to apply a <b>Boolean "AND"</b> to multiple items within the same filter field, you can enter a <b>SOLR query</b>. For example:
<ul>
<li>To retrieve alleles that have [that meet all of the checked criteria, rather than one or more of them] <b>both</b> ____ AND ____, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and enter a SOLR query such as:
<a href="______">datafieldXXname:"value" AND datafieldXXname:"value"</a>.<br />
<i>(A separate section of this document provides additonal information about the <a href="#solr">SOLR query language</a>. Additionally, note that only a subset of the available data fields are shown in the default output of the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>; use the <b>choose columns</b> to add additional columns to the display.)</i></li>
</ul>
</li -->
</ul>
</li>
<li>As explained in the <a href="#isolates-browser">Isolates Browser help</a>, <a href="#filters-on-the-fly">Filters are generated on the fly</a>. As a result, the terms that are listed under each filter will depend on the data set you are currently displaying in the browser. That is also true for the filters in the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>.</li>
</ul>
</div>
</div>
<!-- ====== END_REFGENE_SEARCH_TIPS ========= -->
<!-- ========= REFGENE_DATA_FIELDS ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-data-fields">Data Fields in the Pathogen Detection Reference Gene Catalog <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The <a href="#refgene-data-fields-list">data fields listed below</a> have been indexed by the Pathogen Detection project and are therefore <b>directly searchable</b>, using the <a href="#isolates-browser-advanced-search">advanced search techniques</a> that are described in the <a href="#isolates-browser">Isolates Browser help</a>, because both the Pathogen Detection Reference Gene Catalog and the Isolates Browser use the <a href="#solr">SOLR query language</a>. Note that the <span style="background-color: #ffff00">data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a></span>, as described in the Isolates Browser help.<br /><br />
Each data field reflects an available column in the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> web interface. The <a href="#refgene-output">output</a> section of this document provides tips on how to <a href="#refgene-display-options">customize the display</a>, using the "choose columns" function.<br /><br />
<b>Please note:</b> in the list of available data fields below: <br />
<ul>
<li>The term shown in the <span style="background-color: #ffff00">regular font</span> is the <span style="background-color: #ffff00">display name</span> (column header) shown by the Pathogen Detection Reference Gene Catalog web interface. The term shown in <span style="background-color: #ffff00"><i>(italics)</i></span> is the <span style="background-color: #ffff00"><b><i>name of the corresponding data field</i></b>, if you want to search that field directly</span>.</li>
<li>For example, one data field is listed as: <a href="#refgene-data-field-gene-family">gene family (<b><i>gene_family</i></b>)</a>. The phrase "<b>gene family</b>" (with a space between the words) appears in the Reference Gene Catalog column header, and "<b><i>gene_family</i></b>" (with an underscore bar instead of a space) is the string you should use if you want to search that data field directly.</li>
<li>Brief <b><i>italicized search examples</i></b> are also provided for each data field, when possible, showing how to query the data field directly. The values represent text strings <b>exactly as they appear in the data fields</b>, including upper case and lower case letters, <a href="#special-characters">special characters</a> such as hyphens, etc. The <span style="background-color: #ffff00">data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a></span>.</li>
</ul>
<span id="refgene-data-fields-list"><b>The available data fields in the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> include the following:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
Note that each field is written in this format: &#160;&#160;<b>display name</b> (<b><i>data_field_name</i></b>)<br />
The "display name" is the column header that appears in the Reference Gene Catalog web interface, and the "<i>data_field_name</i>" is the <a href="#case-sensitive">case-sensitive</a> string you should enter if you want to search the data field directly using a <a href="#solr">SOLR query</a>:<br />
<!-- ========== REFGENE_DATA_FIELDS_MINI_TOC =========== -->
<table width="100%">
<tr>
<td width="50%" valign="top">
<a href="#refgene-data-field-allele">Allele (<b><i>allele</i></b>)</a><br />
<a href="#refgene-data-field-gene-family">Gene family (<b><i>gene_family</i></b>)</a><br />
<a href="#refgene-data-field-product-name">Product name (<b><i>product_name</i></b>)</a><br />
<a href="#refgene-data-field-scope">Scope (<b><i>scope</i></b>)</a><br />
<a href="#refgene-data-field-type">Type (<b><i>type</i></b>)</a><br />
<a href="#refgene-data-field-subtype">Subtype (<b><i>subtype</i></b>)</a><br />
<a href="#refgene-data-field-class">Class (<b><i>class</i></b>)</a><br />
<a href="#refgene-data-field-subclass">Subclass (<b><i>subclass</i></b>)</a><br />
<a href="#refgene-data-field-refseq-protein-accession">RefSeq protein accession (<b><i>refseq_protein_accession</i></b>)</a><br />
<a href="#refgene-data-field-refseq-nucleotide-accession">RefSeq nucleotide accession (<b><i>refseq_nucleotide_accession</i></b>)</a><br />
<a href="#refgene-data-field-genbank-protein-accession">GenBank protein accession (<b><i>genbank_protein_accession</i></b>)</a><br />
<a href="#refgene-data-field-genbank-nucleotide-accession">GenBank nucleotide accession (<b><i>genbank_nucleotide_accession</i></b>)</a><br />
</td>
<td width="50%" valign="top">
<a href="#refgene-data-field-organism">organism fields:</a><br />
<div style="padding-left: 2em">
<a href="#refgene-data-field-whitelisted-taxa">Whitelisted taxa (<b><i>whitelisted_taxa</i></b>)</a><br />
<a href="#refgene-data-field-blacklisted-taxa">Blacklisted taxa (<b><i>blacklisted_taxa</i></b>)</a><br />
</div>
<a href="#refgene-data-field-curated-refseq-start">Curated refseq start (<b><i>curated_refseq_start</i></b>)</a><br />
<a href="#refgene-data-field-genbank-start">GenBank start (<b><i>genbank_start</i></b>)</a><br />
<a href="#refgene-data-field-genbank-stop">GenBank stop (<b><i>genbank_stop</i></b>)</a><br />
<a href="#refgene-data-field-genbank-strand">GenBank strand (<b><i>genbank_strand</i></b>)</a><br />
<a href="#refgene-data-field-refseq-start">RefSeq start (<b><i>refseq_start</i></b>)</a><br />
<a href="#refgene-data-field-refseq-stop">RefSeq stop (<b><i>refseq_stop</i></b>)</a><br />
<a href="#refgene-data-field-refseq-strand">RefSeq strand (<b><i>refseq_strand</i></b>)</a><br />
<a href="#refgene-data-field-pubmed-reference">PubMed reference (<b><i>pubmed_reference</i></b>)</a><br />
<a href="#refgene-data-field-synonyms">synonyms (<b><i>synonyms</i></b>)</a><br />
<a href="#refgene-data-field-links">links (<b><i>links_count</i></b>)</a><br />
<!-- a href="#refgene-data-field-_______">_______ (<b><i>_______</i></b>)</a><br / -->
</td>
</tr>
</table>
<!-- ========= END_REFGENE_DATA_FIELDS_MINI_TOC ========= -->
<!-- ========= REFGENE_DATA_FIELDS_DESCRIPTIONS =========== -->
<ul>
<!-- ======== REFGENE_DATA_FIELD_allele ========== -->
<li id="refgene-data-field-allele">
<span style="background-color: #cde1ff">Allele (<b><i>allele</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Gene or allele. If the data element is an allele (e.g., 23S_C2627A), its name reflects the name of the gene family in which a point mutation was found, the location coordinate of the mutation, and the wild-type and mutated nucleotides/amino acids.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>allele:searchterm</i></li>
<li>Search for: &#160; <i>allele:gyrA_D82G</i><br />
to show all alleles with that name.<br />
<i>(A separate section of this document describes the <a href="#refgene-non-redundant">non-redundant</a> nature of the Reference Gene Catalog, and how the definition of redundant (or 'non-unique') will differ, depending on the type of data element (allele, gene, or point mutation).)</i>
</li>
<li>Search for: &#160; <i>allele:blaB-1</i><br />
to show the reference gene for the blaB-1 allele: subclass B1 metallo-beta-lactamase BlaB-1.</li>
<li>Search for: &#160; <i>allele:blaB-*</i><br />
to show the reference genes for all blaB alleles.</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_gene_family ========== -->
<li id="refgene-data-field-gene-family">
<span style="background-color: #cde1ff">Gene family (<b><i>gene_family</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Gene symbol, or, if a point mutation, the reference gene symbol.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>gene_family:searchterm</i></li>
<li>Search for: &#160; <i>gene_family:bla2</i><br />
to show members of the bla2 gene family: BcII family subclass B1 metallo-beta-lactamases. Each hit will correspond to a unique protein sequence, and corresponding unique nucleotide sequence.
That is, each hit will have a unique <a href="#accession-prefix-wp">WP_* accession</a> (refseq_protein_accession), and/or a corresponding unique <a href="https://www.ncbi.nlm.nih.gov/books/NBK50679/#RefSeqFAQ.what_is_an_ng_accession_and_wh">NG_* accession</a> (refseq_nucleotide_accession). <i>(A separate section of this document describes the <a href="#refgene-non-redundant">non-redundant</a> nature of the Reference Gene Catalog, and how the definition of redundant (or 'non-unique') will differ, depending on the type of data element (allele, gene, or point mutation).)</i>
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_product_name ========== -->
<li id="refgene-data-field-product-name">
<span style="background-color: #cde1ff">Product name (<b><i>product_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Name of gene product or genomic region.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#query-tips-phrase-search-quotes">quotes to search for a phrase</a>.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>product_name:searchterm</i></li>
<li>Search for: &#160; <i>product_name:"BcII family subclass B1 metallo-beta-lactamase"</i><br />
to show all entries in the Reference Gene Catalog that have the exact product name that you specified, including upper and lower case letters as well as special characters (in this case, hyphens). As of July 5, 2019, the search retrieves 6 hits.<br /><br />
Note: If the search is entered <i>without quotes</i> surrounding the product name, such as:<br />
Search for: &#160; <i>product_name:BcII family subclass B1 metallo-beta-lactamase</i>
then each space is interpreted by the search system as a Boolean OR. As of July 5, 2019, the search retrieves 1,466 hits.<br />
<i>(<a href="#operators">read more about SOLR operators</a>)</i>
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_scope ========== -->
<li id="refgene-data-field-scope">
<span style="background-color: #cde1ff">Scope (<b><i>scope</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
This field specifies the <a href="#refgene-scope">data subset</a> to which an allele or gene belongs, and the <b>value</b> can either be <a href="#refgene-scope-core"><b>core</b></a> (curated for relevance to resistance, usually AMR-specific genes and point mutations) or <a href="#refgene-scope-plus"><b>plus</b></a> (genes related to biocide and stress resistance, general efflux, virulence, or antigenicity, or where the presence of this gene may not be informative as to resistance phenotype or the relationship is not clear).<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>. In this case, both the data field name and the value are written in all <b>lower case</b>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>scope:searchterm</i></li>
<li>Search for: &#160; <i>scope:plus</i><br />
to show the genes in the "plus" subset of the Pathogen Detection Reference Gene Catalog. That subset includes genes related to biocide and stress resistance, general efflux, virulence, or antigenicity.
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_type ========== -->
<li id="refgene-data-field-type">
<span style="background-color: #cde1ff">Type (<b><i>type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Classification for the type of gene found, such as AMR, STRESS, or VIRULENCE.
A more detailed description of the type and subtype fields is available on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#element-type-and-subtype">AMRFinderPlus wiki</a>.<br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the phenotype associated with the genetic element.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the <b>values</b> for this data field are written in <b>upper case</b>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>type:searchterm</i></li>
<li>Search for: &#160; <i>type:STRESS</i><br />
to show genes that confer stress resistance.<br />
As an alternative method for retrieving those genes, you can open the "<b>Filters</b>" function of the Reference Gene Catalog and check the box for the desired Type. By doing so, the Filters function will refresh itself to show the subtype values that are available for the type you have selected, enabling you to further narrow your search results, if desired. For example, the subtype values under STRESS currently include BIOCIDE, HEAT, and METAL. (As noted below, <a href="#refgene-filters">filters</a> are <a href="#refgene-filters-on-the-fly">generated on the fly</a> and reflect the attributes of the data that you are currently viewing.)
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_subtype ========== -->
<li id="refgene-data-field-subtype">
<span style="background-color: #cde1ff">Subtype (<b><i>subtype</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Classification for the subtype of gene found.
A more detailed description of the type and subtype fields is available on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#element-type-and-subtype">AMRFinderPlus wiki</a>.<br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the <b>values</b> for this data field are written in <b>upper case</b>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>subtype:searchterm</i></li>
<li>Search for: &#160; <i>subtype:HEAT</i><br />
to show genes that confer heat resistance.<br />
As an alternative method for retrieving those genes, you can open the "<b>Filters</b>" function of the Reference Gene Catalog and check the box for the desired Subtype. By doing so, the Filters function will refresh itself to show the corresponding type under which the selected subtype falls. For example, the subtype value of HEAT falls under the type STRESS. (As noted below, <a href="#refgene-filters">filters</a> are <a href="#refgene-filters-on-the-fly">generated on the fly</a> and reflect the attributes of the data that you are currently viewing.)
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_class ========== -->
<li id="refgene-data-field-class">
<span style="background-color: #cde1ff">Class (<b><i>class</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
"Class" provides a broad definition of the phenotype affected by the gene or allele, and includes resistance phenotypes such as antimicrobial and stress resistance, virulence, and antigenicity. For some virulence genes this field contains typing information.
More information about the class and subclass fields can be found on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#class-and-subclass">AMRFinderPlus wiki</a>.<br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the <b>values</b> for this data field are written in <b>upper case</b>, as shown in the example below.<br /><br />
Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>class:searchterm</i></li>
<li>Search for: &#160; <i>class:BETA-LACTAM</i><br />
to show all genes classified as BETA-LACTAM.
<!-- When the search results are displayed, clicking on the "Filters" tab will display options for further narrowing the search results, such as subclass and gene_family, that are specific to the BETA-LACTAM class of genes. --><br />
As an alternative method for retrieving those genes, you can open the "<b>Filters</b>" function of the Reference Gene Catalog and check the box for the desired Class. By doing so, the Filters function will refresh itself to show the subclass values that are available for the class you have selected, enabling you to further narrow your search results, if desired. For example, the subclass values under BETA-LACTAM currently include BETA-LACTAM, CARBAPENEM, CEPHALOSPORIN, CEPHALOTHIN, and METHICILLIN. (As noted below, <a href="#refgene-filters">filters</a> are <a href="#refgene-filters-on-the-fly">generated on the fly</a> and reflect the attributes of the data that you are currently viewing.)
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_subclass ========== -->
<li id="refgene-data-field-subclass">
<span style="background-color: #cde1ff">Subclass (<b><i>subclass</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Where it is known, "Subclass" provides a more specific definition of the particular antibiotics or classes that are affected by the gene or point mutation (e.g., that are resisted by the gene/allele). While most subclass designations are self-explanatory, a few others have particular meanings. Specifically, "CEPHALOSPORIN" is equivalent to the Lahey 2be definition; "CARBAPENEM" means the protein has carbapenemase activity, but it might or might not confer resistance to other beta-lactams; "QUARTERNARY AMMONIUM" are quarternary ammonium compounds. In addition, stx subtypes (e.g., STX2E) and intimin subtypes (e.g., ALPHA) are defined for Shiga toxin proteins (class of STX1 or STX2) and intimins (class of INTIMIN) respectively. Where the phenotypic information is incomplete, contradictory, or unclear, the "Class" value is used for the "Subclass" value.<br /><br />
More information about the class and subclass fields can be found on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#class-and-subclass">AMRFinderPlus wiki</a>.<br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i><br /><br />
Data field names and values are <a href="#case-sensitive">case sensitive</a>, and the <b>values</b> for this data field are written in <b>upper case</b>, as shown in the example below.<br /><br />
Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>subclass:searchterm</i></li>
<li>Search for: &#160; <i>subclass:CEPHALOSPORIN</i><br />
to show genes that confer resistance to cephalosporin antibiotics.<br />
As an alternative method for retrieving those genes, you can open the "<b>Filters</b>" function of the Reference Gene Catalog and check the box for the desired subclass. The Filters function will then refresh itself to show the corresponding class under which the selected subclass falls. For example, the subclass value of CEPHALOSPORIN falls under the class BETA-LACTAM. (As noted below, <a href="#refgene-filters">filters</a> are <a href="#refgene-filters-on-the-fly">generated on the fly</a> and reflect the attributes of the data that you are currently viewing.)
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_refseq_protein_accession ========== -->
<li id="refgene-data-field-refseq-protein-accession">
<span style="background-color: #cde1ff">RefSeq protein accession (<b><i>refseq_protein_accession</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Accession of the <a href="https://www.ncbi.nlm.nih.gov/refseq/">RefSeq</a> protein sequence record in which the gene or allele is found. It generally has a <a href="#accession-prefix-wp">WP_* prefix</a>.
<i>(Read more <a href="https://www.ncbi.nlm.nih.gov/refseq/about/">about RefSeq</a>, the distinct format of <a href="https://www.ncbi.nlm.nih.gov/books/NBK21091/table/ch18.T.refseq_accession_numbers_and_mole/?report=objectonly">RefSeq accessions</a>, and the various <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)</i><br /><br />
Enter the sequence record identifier in the <b>accession.version format</b>, as shown in the first example below.<br />
If you don't know the <b>version</b> of the sequence record, enter <b>just the accession</b>, as shown in the second example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>refseq_protein_accession:searchterm</i></li>
<li>Search for: &#160; <i>refseq_protein_accession:WP_001281243.1</i><br />
to show the Reference Gene Catalog entries associated with this RefSeq protein sequence record. If multiple alleles have been found to exist in this protein, there will be a separate entry for each allele.
<i>(A separate section of this document describes the <a href="#refgene-non-redundant">non-redundant</a> nature of the Reference Gene Catalog, and how the definition of redundant (or 'non-unique') will differ, depending on the type of data element (allele, gene, or point mutation).)</i>
</li>
<li>Search for: &#160; <i>refseq_protein_accession:WP_001281243</i><br />
to show the Reference Gene Catalog entries associated with this RefSeq protein accession, regardless of its version number. <i>(The Reference Gene Catalog contains the latest version of a sequence record; if you don't know what version number is the latest, enter only the accession as your query, without any dot or version number.)</i>
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_refseq_nucleotide_accession ========== -->
<li id="refgene-data-field-refseq-nucleotide-accession">
<span style="background-color: #cde1ff">RefSeq nucleotide accession (<b><i>refseq_nucleotide_accession</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Accession of the <a href="https://www.ncbi.nlm.nih.gov/refseq/">RefSeq</a> nucleotide sequence record in which the gene or allele is found. It generally has an <!-- a href="https://www.ncbi.nlm.nih.gov/books/NBK50679/#RefSeqFAQ.what_is_an_ng_accession_and_wh" --><a href="#accession-prefix-ng">NG_* prefix</a>.
<i>(Read more <a href="https://www.ncbi.nlm.nih.gov/refseq/about/">about RefSeq</a>, the distinct format of <a href="https://www.ncbi.nlm.nih.gov/books/NBK21091/table/ch18.T.refseq_accession_numbers_and_mole/?report=objectonly">RefSeq accessions</a>, and the various <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)</i><br /><br />
Enter the sequence record identifier in the <b>accession.version format</b>, as shown in the first example below.<br />
If you don't know the <b>version</b> of the sequence record, enter <b>just the accession</b>, as shown in the second example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>refseq_nucleotide_accession:searchterm</i></li>
<li>Search for: &#160; <i>refseq_nucleotide_accession:NG_047553.1</i><br />
to show the Reference Gene Catalog entry associated with this RefSeq nucleotide sequence record.
</li>
<li>Search for: &#160; <i>refseq_nucleotide_accession:NG_047553</i><br />
to show the Reference Gene Catalog entries associated with this RefSeq nucleotide accession, regardless of its version number. <i>(The Reference Gene Catalog contains the latest version of a sequence record; if you don't know what version number is the latest, enter only the accession as your query, without any dot or version number.)</i>
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_genbank_protein_accession ========== -->
<li id="refgene-data-field-genbank-protein-accession">
<span style="background-color: #cde1ff">GenBank protein accession (<b><i>genbank_protein_accession</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Accession of the <a href="https://www.ncbi.nlm.nih.gov/genbank/">GenBank</a> protein sequence record in which the gene or allele is found. <i>(Read more about the format of <a href="https://support.nlm.nih.gov/knowledgebase/article/KA-03434/en-us">GenBank accessions</a>, and about the various <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)</i><br /><br />
Enter the sequence record identifier in the <b>accession.version format</b>, as shown in the first example below.<br />
If you don't know the <b>version</b> of the sequence record, enter <b>just the accession</b>, as shown in the second example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>genbank_protein_accession:searchterm</i></li>
<li>Search for: &#160; <i>genbank_protein_accession:AAB00464.1</i><br />
to show the Reference Gene Catalog entries associated with this GenBank protein.
</li>
<li>Search for: &#160; <i>genbank_protein_accession:AAB00464</i><br />
to show the Reference Gene Catalog entries associated with this GenBank protein accession, regardless of its version number. <i>(The Reference Gene Catalog contains the latest version of a sequence record; if you don't know what version number is the latest, enter only the accession as your query, without any dot or version number.)</i>
</li>
</ul>
</li>
<!-- ===== REFGENE_DATA_FIELD_genbank_nucleotide_accession ===== -->
<li id="refgene-data-field-genbank-nucleotide-accession">
<span style="background-color: #cde1ff">GenBank nucleotide accession (<b><i>genbank_nucleotide_accession</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Accession of the <a href="https://www.ncbi.nlm.nih.gov/genbank/">GenBank</a> nucleotide sequence record in which the gene or allele is found. <i>(Read more about the format of <a href="https://www.ncbi.nlm.nih.gov/Sequin/acc.html">GenBank accessions</a>, and about the various <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)</i><br /><br />
Enter the sequence record identifier in the <b>accession.version format</b>, as shown in the first example below.<br />
If you don't know the <b>version</b> of the sequence record, enter <b>just the accession</b>, as shown in the second example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>genbank_nucleotide_accession:searchterm</i></li>
<li>Search for: &#160; <i>genbank_nucleotide_accession:L26954.1</i><br />
to show the Reference Gene Catalog entries associated with this GenBank nucleotide sequence.
</li>
<li>Search for: &#160; <i>genbank_nucleotide_accession:L26954</i><br />
to show the Reference Gene Catalog entries associated with this GenBank nucleotide sequence, regardless of its version number. <i>(The Reference Gene Catalog contains the latest version of a sequence record; if you don't know what version number is the latest, enter only the accession as your query, without any dot or version number.)</i>
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_organism ========== -->
<li id="refgene-data-field-organism">
<span style="background-color: #cde1ff">organism fields:</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<!--Organism-specific genes or mutations. The data fields listed below are populated only if a gene or mutation is specific to a given organism(s). <i>(Note: if a gene or mutation is present in multiple organisms, the organism data field in the Reference Gene Catalog will be blank. The corresponding RefSeq protein record (<a href="#accession-prefix-wp">WP_* accession</a>), however, will list the organisms in which the protein occurs.)</i -->
The <a href="#refgene-data-field-whitelisted-taxa"><i>whitelisted_taxa</i></a> and <a href="#refgene-data-field-blacklisted-taxa"><i>blacklisted_taxa</i></a> data fields below are used for retrieving organism-specific results. Specifically, they are used to screen for known resistance-causing point mutations within an organism group, and for common, non-informative genes, respectively.<br /><br />
Point mutations are currently identified for 28 bacterial taxonomic groups, which are listed <a href="https://github.com/ncbi/amr/wiki/Curated-organisms">here</a>. Note that rRNA mutations will not be screened if only a protein file is provided. To screen known Shigella mutations, use Escherichia as the organism. See Organism option below for more details.
<br /><br />
<ul>
<li id="refgene-data-field-whitelisted-taxa">
<span style="background-color: #cde1ff">Whitelisted taxa (<b><i>whitelisted_taxa</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
The <i>whitelisted_taxa</i> data field indicates the taxa for which this element is curated for mutational resistance mechanisms.<br /><br />
An example of a whitelisted sequence is the 16S_A1055G point mutation in <i>E. coli</i>.<br /><br />
See the <a href="https://github.com/ncbi/amr/wiki/Running-AMRFinderPlus#--organism-option">AMRFinderPlus documentation</a> for a list of taxa where resistance mechanisms based on mutations are curated.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>whitelisted_taxa:searchterm</i></li>
<li>Search for: &#160; <i>whitelisted_taxa:Escherichia</i><br />
to list the resistance-causing point mutations found in the <i>Escherichia</i> taxonomic group (i.e., <i>Escherichia coli</i> and <i>Shigella spp.</i>, <i>Escherichia fergusonii</i>).</li>
</ul>
<b>Additional note:</b>
<ul>
<li>The <b><a href="#amr-finder">AMRFinderPlus</a> software</b> automatically looks for whitelisted sequences if an organism is specified during a search. For example, if AMRFinderPlus is run with <i>Escherichia</i> in the organism field, then your isolate will be screened for the presence of point mutations that confer antimicrobial resistance in this taxonomic group (such as the 16S_A1055G point mutation). If AMRFinderPlus is run without <i>Escherichia</i> in the organism field, then your isolate will not be screened for the presence of this point mutation.</li>
</ul>
</div>
</li>
<li id="refgene-data-field-blacklisted-taxa">
<span style="background-color: #cde1ff">Blacklisted taxa (<b><i>blacklisted_taxa</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
The <i>blacklisted_taxa</i> data field screens for <b>genes that are common within a taxonomic group</b>, and are <b>therefore non-informative</b> with regard to antimicrobial resistance.
<!-- Organisms in which this sequence can be blacklisted, because it is ubiquitous that taxon/taxa and therefore reporting it does not provide useful information. --><br /><br />
An example of a blacklisted sequence is fieF, which is blacklisted for both <i>E. coli</i> and <i>Salmonella</i>.
<br /><br />
The available values in <b>blacklisted_taxa</b> currently include:
<ul>
<li><i>Escherichia</i> &gt; <i>Escherichia coli</i> and <i>Shigella spp.</i>, <i>Escherichia fergusonii</i></li>
<li><i>Klebsiella</i> &gt; <i>Klebsiella pneumoniae</i> and <i>Klebsiella oxytoca</i></li>
<li><i>Salmonella</i> &gt; <i>Salmonella enterica</i></li>
<li><i>Staphylococcus</i> &gt; <i>Staphylococcus pseudintermedius</i></li>
<li><i>Vibrio</i> &gt; <i>Vibrio cholerae</i></li>
</ul>
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>blacklisted_taxa:searchterm</i></li>
<li>Search for: &#160; <i>blacklisted_taxa:Klebsiella</i><br />
to list genes that have been blacklisted in the <i>Klebsiella</i> taxonomic group (i.e., <i>Klebsiella pneumoniae</i> and <i>Klebsiella oxytoca</i>).
</li>
<li>Search for: &#160; <i>blacklisted_taxa:Escherichia AND blacklisted_taxa:Salmonella</i><br />
to list genes that have been blacklisted in both the <i>Escherichia</i> taxonomic group (i.e., <i>Escherichia coli</i> and <i>Shigella spp.</i>, <i>Escherichia fergusonii</i>), and in <i>Salmonella</i>.
</li>
</ul>
<b>Additional note:</b>
<ul>
<li>The <b><a href="#amr-finder">AMRFinderPlus</a> software</b> automatically excludes blacklisted sequences if an organism is specified during a search. For example, if AMRFinderPlus is run with either <i>Escherichia</i> or <i>Salmonella</i> in the organism field, then your isolate will be screened for the presence of common genes in the taxonomic group, and those common genes will be eliminated from the AMRFinderPlus results. For example, the fieF gene will not be reported even if it is present in your isolate, since fieF is ubiquitous in both of these taxa and reporting it does not provide useful information.
<!-- For example, if AMRFinderPlus is run with either <i>Escherichia</i> or <i>Salmonella</i> in the organism field, then your isolate will be screened for the presence of common genes in the taxonomic group that are not informative with regard to antimicrobial resistance (such as the fieF gene), and those common genes will be eliminated from the AMRFinderPlus results. --></li>
</ul>
</div>
</li>
</ul>
<!-- Data field names and values are <a href="#case-sensitive">case sensitive</a>. When searching the organism data fields, enter the <b>genus name</b> exactly as it is listed under "Filters," as shown in the examples above. As an alternative to a direct search of the organism fields, you can simply activate the check box for the desired organism in the Filters tab of the Reference Gene Catalog to retrieve the alleles and genes that are whitelisted or blacklisted for that taxonomy group.<br /><br / -->
</li>
<!-- ======== REFGENE_DATA_FIELD_curated_refseq_start ========== -->
<li id="refgene-data-field-curated-refseq-start">
<span style="background-color: #cde1ff">Curated RefSeq start (<b><i>curated_refseq_start</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Did curators alter the start coordinate from the GenBank record when making the RefSeq record? The allowable values for this field are <b>Yes</b> or <b>No</b>, and must be written with a leading upper case letter.<br /><br />
A "Yes" indicates that NCBI RefSeq curators either changed the translation start site (in the <a href="#accession-prefix-ng">NG_* genomic sequence record</a>) from what was shown on the corresponding GenBank record, or provided start and stop coordinates that the GenBank record lacked.<br /><br />
The data field name is also <a href="#case-sensitive">case sensitive</a> and should be written in all lower case, as shown in the example below. (Separate sections of this document provide additional details about <a href="#case-sensitive">case sensitive</a> searches and <a href="#accession-prefixes">accession prefixes</a> that appear in the Pathogen Detection project.)<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>curated_refseq_start:searchterm</i></li>
<li>Search for: &#160; <i>curated_refseq_start:Yes</i><br />
to show all genes and alleles that have a curated RefSeq start.
</li>
</ul>
</li>
<!-- ======== REFGENE_DATA_FIELD_genbank_start ========== -->
<li id="refgene-data-field-genbank-start">
<span style="background-color: #cde1ff">GenBank start (<b><i>genbank_start</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The start coordinate of the reference sequence for this element on the GenBank nucleotide sequence record. This field should always be lower than the <b>GenBank stop</b> field regardless of the <b>GenBank strand</b>.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_genbank_stop ========== -->
<li id="refgene-data-field-genbank-stop">
<span style="background-color: #cde1ff">GenBank stop (<b><i>genbank_stop</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The stop coordinate of this reference sequence for this element on the GenBank nucleotide sequence record. This field should always be higher than the <b>GenBank start</b> field regardless of the <b>GenBank strand</b>.<br /><br />
</li>
<!-- ===== REFGENE_DATA_FIELD_genbank_strand ====== -->
<li id="refgene-data-field-genbank-strand">
<span style="background-color: #cde1ff">GenBank strand (<b><i>genbank_strand</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The strand (<b>+</b>/<b>-</b>) on which the reference sequence occurs, relative to the nucleotide sequence that appears in the genbank_nucleotide_accession listed for the gene or allele.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_refseq_start ========== -->
<li id="refgene-data-field-refseq-start">
<span style="background-color: #cde1ff">RefSeq start (<b><i>refseq_start</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The start coordinate of this reference sequence for this element on the RefSeq nucleotide sequence record. This field should always be lower than the <b>RefSeq stop</b> field regardless of the <b>RefSeq strand</b>.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_refseq_stop ========== -->
<li id="refgene-data-field-refseq-stop">
<span style="background-color: #cde1ff">RefSeq stop (<b><i>refseq_stop</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The stop coordinate of this reference sequence for this element on the RefSeq nucleotide sequence record. This field should always be higher than the <b>RefSeq start</b> field regardless of the <b>RefSeq strand</b>.<br /><br />
</li>
<!-- ===== REFGENE_DATA_FIELD_refseq_strand ====== -->
<li id="refgene-data-field-refseq-strand">
<span style="background-color: #cde1ff">RefSeq strand (<b><i>refseq_strand</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The strand (<b>+</b>/<b>-</b>) of the reference sequence for this element, relative to the nucleotide sequence that appears in the refseq_nucleotide_accession listed for the gene or allele.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_pubmed_reference ========== -->
<li id="refgene-data-field-pubmed-reference">
<span style="background-color: #cde1ff">PubMed reference (<b><i>pubmed_reference</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Links to references describing the gene, if available. The value in the data field is a <a href="https://www.ncbi.nlm.nih.gov/pubmed/">PubMed</a> identifier (PMID). Clicking on an entry in this field will take you to the page for that paper in PubMed. <!-- ><i>(<a href="#_______">read more about _______</a>)</i --> <br /><br />
<!-- b>Tips:</b><br />
A separate section of this document provide search tips about <a href="#case-sensitive">case sensitive</a> searches, search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>pubmed_reference:searchterm</i></li>
<li>Search for: &#160; <i>pubmed_reference:_________ AND pubmed_reference:_________</i><br />
to show ___________________________.
</li>
</ul -->
</li>
<!-- ======== REFGENE_DATA_FIELD_synonyms ========== -->
<li id="refgene-data-field-synonyms">
<span style="background-color: #cde1ff">Synonyms (<b><i>synonyms</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Other symbols used to refer to this element / gene in the literature.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_links ========== -->
<li id="refgene-data-field-links">
<span style="background-color: #cde1ff">Links (<b><i>links_count</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Links will contain hyperlinks to other resources. Currently the field contains links to PubChem when there is an identical protein within PubChem for the current protein.<br /><br />
</li>
<!-- ======== REFGENE_DATA_FIELD_XXXXXXX ========== -->
<!-- li id="refgene-data-field-XXXXXXXX">
<span style="background-color: #cde1ff">_________ (<b><i>_________</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of Reference Gene Catalog data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Text text text text text text text text text text text. <i>(<a href="#_______">read more about _______</a>)</i><br /><br />
<b>Tips:</b><br />
A separate section of this document provide search tips about <a href="#case-sensitive">case sensitive</a> searches, search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>_________:searchterm</i></li>
<li>Search for: &#160; <i>_________:_________ AND _________:_________</i><br />
to show ___________________________.
</li>
</ul>
</li -->
<!-- ======== END_OF_LAST_DATA_FIELD ========== -->
</ul>
<!-- ========= END_REFGENE_DATA_FIELDS_DESCRIPTIONS =========== -->
</div>
</div>
<!-- ====== END_REFGENE_DATA_FIELDS ========= -->
<!-- ========= REFGENE_OUTPUT ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-output">Output from the Pathogen Detection Reference Gene Catalog <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<!-- ========= REFGENE_OUTPUT_TABLE ============ -->
<span id="refgene-output-table"><b>Tabular list of genes</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>Upon opening the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>, a table displays data for <b>all genes and alleles</b> that are currently in the catalog.</li>
<li><b>Every row</b> in the Pathogen Detection Reference Gene Catalog display is a <b>reference gene</b> or a <b>point mutation</b>.</li>
<li>The data available for each item can include gene or allele name, product name, type, subtype, class, subclass, and more, as available. (See the <a href="#refgene-data-fields">Pathogen Detection Reference Gene Catalog data fields</a> for a complete list.) Some of the data elements, such as accessions for corresponding protein and nucleotide sequence records and publications, <b>link</b> to additional information in related databases such as RefSeq, GenBank, and PubMed.</li>
<li>The genes and point mutations can be <b>sorted</b> by clicking on column headers, <b>faceted</b> by using <a href="#refgene-output-filters">filters</a> (e.g., class:AMINOGLYCOSIDE), or <b>searched</b> using <a href="#refgene-basic-search">basic</a> or <a href="#refgene-advanced-search">advanced</a> search techniques. <!-- (see <a href="#refgene-sample-searches"><span style="color:#d70000">use cases/sample searches</span> of the Reference Gene Catalog</a> and an <a href="#refgene-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>). --></li>
<li><b>Download</b> the list of elements and their metadata shown. Click on the <b>Download</b> button just above the main data table and select <b>File type: Table</b>. From there you can select Tab-delimited (.tsv) or Comma-delimited (.csv) and set the filename. Clicking <b>Download</b> will download the data shown in the table filtered by the search and with the visible columns included. See the <a href="#refgene-access-download">Download the Reference Gene Catalog data</a> section for more information and how to download sequences.</li>
</ul>
<!-- ========= END_REFGENE_OUTPUT_TABLE ============ -->
<!-- ========= REFGENE_FILTERS ============ -->
<span id="refgene-output-filters"><b>Filters to refine results</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<li>The "Filters" menu options in the <a href="/pathogens/isolates#/refgene/">Reference Gene Catalog</a> enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a <a href="#refgene-basic-search">basic search</a> or an <a href="#refgene-advanced-search">advanced search</a>.</li>
<li>By default, each filter displays the <b>top 10 terms</b> (based on the number of genes/alleles retrieved by a term). The "<b>more [+]</b>" option displays up to the <b>top 100 terms</b>, listed alphabetically within that set of top 100.</li>
<li id="refgene-filters-on-the-fly"><b>Filters are generated on the fly</b>. The choices listed in the "Filters" tab depend on the data set you are currently displaying in the browser, and reflect the attributes of the genes and alleles in that data set.</li>
<li>A separate section of this document provides <a href="#refgene-filters">additional information about Filters</a>.</li>
</ul>
<!-- ========= END_REFGENE_FILTERS ============ -->
<!-- ========= REFGENE_OUPUT_DISPLAY_OPTIONS ========= -->
<span id="refgene-display-options"><b>Customize the Reference Gene Catalog display</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The columns displayed by the Reference Gene Catalog reflect the <a href="#refgene-data-fields">data fields</a>. By default, the Reference Gene Catalog displays only a subset of the available data fields.</li>
<li id="refgene-choose-columns">You can use the "<b>Choose Columns</b>" option at the top of the tabular list of genes in order to remove columns, select additional columns to display, and/or change the order of the columns.</li>
<li>The options you select will <b>persist</b> within a given browser (e.g., Chrome, Edge, Internet Explorer, Firefox, Safari) until that browser's cookies are cleared/reset.</li>
</ul>
<!-- ========= END_REFGENE_OUPUT_DISPLAY_OPTIONS ========= -->
</div>
</div>
<!-- ====== END_REFGENE_OUTPUT ========= -->
<!-- ========= REFGENE_USE_CASES ============ -->
<div style="padding-left: 2em">
<h4 id="refgene-sample-searches">Use cases/sample searches of the Pathogen Detection Reference Gene Catalog <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><a href="#refgene-sample-search-multidrug-resistant">Find multidrug resistant genes</a></li>
<li><a href="#refgene-sample-search-amr-gene-carbapenem">Find carbapenem resistant genes</a></li>
<li><a href="#refgene-sample-search-amr-point-mutations-quinolones">Find point mutations in <i>Escherichia</i> that confer resistance to quinolones</a></li>
</ul>
<!-- ====== REFGENE_SAMPLE_SEARCH_MULTIDRUG_RESISTANT =========== -->
<span id="refgene-sample-search-multidrug-resistant"><b>Find multidrug resistant genes</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example:<br />
<ul>
<li>Open the NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>.</li>
<li>Open the "<b><i>Filters</i></b>" function.</li>
<li>By <b>default</b>, each filter shows the <b>top 100 terms</b> (based on the number of genes/alleles retrieved by a term).</li>
<li>In the <b><i>Class</i></b> section of the filters, scroll down to find MULTIDRUG or search for MULTIDRUG in the search box.</li>
<li>"<b><i>MULTIDRUG</i></b>" now appears as an option under <b><i>Class</i></b>. Select that option. Upon this action, the Filters display will refresh itself to show only the set of filters that apply to that class of antibiotics, and the tabular list of genes and alleles will refresh itself to show only the items that fall in that class.</li>
</ul>
<i>An alternative method for retrieving those genes and alleles is to search the class data field directly. To do this, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and enter the query:<br /> <b>class:MULTIDRUG</b><br />
Separate sections of this file provide details about <a href="#refgene-filters">filters</a>, and about how to directly search specific <a href="#refgene-data-fields">data fields</a>, such as the <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> fields, and <a href="#case-sensitive">case sensitive</a> searches.</i><br /><br />
</div>
<!-- ====== END_REFGENE_SAMPLE_SEARCH_MULTIDRUG_RESISTANT ======== -->
<!-- ====== REFGENE_SAMPLE_SEARCH_AMR_GENE_CARBAPENEM =========== -->
<span id="refgene-sample-search-amr-gene-carbapenem"><b>Find carbapenem resistant genes</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example:<br />
<ul>
<li>Open the NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>.</li>
<li>Open the "<b><i>Filters</i></b>" function.</li>
<li>In the <b><i>Class</i></b> section of the filters, select "<b><i>BETA-LACTAM</i></b>." Upon this action, the Filters display will refresh itself to show only the set of filters that apply to the Beta-Lactam class.</li>
<li>The <b><i>Subclass</i></b> section of the filters will now list "<b><i>CARBAPENEM</i></b>" as an option. Check the box for CARBAPENEM to show the genes that confer resistance to that subclass of antibiotics.</li>
</ul>
<i>An alternative method for retrieving those genes and alleles is to search the subclass data field directly. To do this, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and enter the query:<br /> <b>subclass:CARBAPENEM</b><br />
Separate sections of this file provide details about <a href="#refgene-filters">filters</a>, and about how to directly search specific <a href="#refgene-data-fields">data fields</a>, such as the <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> fields, and <a href="#case-sensitive">case sensitive</a> searches.</i><br /><br />
</div>
<!-- ====== END_REFGENE_SAMPLE_SEARCH_AMR_GENE_CARBAPENEM ======== -->
<!-- ===== REFGENE_SAMPLE_SEARCH_AMR_POINT_MUTATIONS_QUINOLONES ===== -->
<span id="refgene-sample-search-amr-point-mutations-quinolones"><b>Find point mutations in <i>Escherichia</i> that confer resistance to quinolones</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example:<br />
<ul>
<li>Open the NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>.</li>
<li>Open the "<b><i>Filters</i></b>" function.</li>
<li>By <b>default</b>, each filter shows the <b>top 100 terms</b> (based on the number of genes/alleles retrieved by a term).</li>
<li>In the <b><i>Organism</i></b> section of the filters, select "<b><i>Escherichia</i></b>." Upon this action, the Filters display will refresh itself to show only the set of filters that apply to <i>Escherichia</i>.</li>
<li>In the <b><i>Subtype</i></b> section of the filters, select "<b><i>POINT</i></b>." Upon this action, the Filters display will refresh itself to show only the set of filters that apply to <i>Escherichia</i> point mutations.</li>
<li>In the <b><i>Subclass</i></b> section of the filters, scroll to "<b><i>QUINOLONE</i></b>" or type that term in the search box. It now appears as an option. Select that option.</li>
<li>The resulting output is a list of <i>Escherichia</i> point mutations that confer resistance to quinolone antibiotics.</li>
</ul>
<i>An alternative method for retrieving those genes and alleles is to search the organism, subtype, and subclass data fields directly. To do this, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and enter the query:<br /> <b>organism:Escherichia AND subtype:POINT AND subclass:QUINOLONE</b><br />
Separate sections of this file provide details about <a href="#refgene-filters">filters</a>, and about how to directly search specific <a href="#refgene-data-fields">data fields</a>, such as the <a href="#refgene-data-field-organism">organism</a>, <a href="#refgene-data-field-type">type</a>, <a href="#refgene-data-field-subtype">subtype</a>, <a href="#refgene-data-field-class">class</a>, and <a href="#refgene-data-field-subclass">subclass</a> fields, and <a href="#case-sensitive">case sensitive</a> searches.</i><br /><br />
</div>
<!-- ==== END_REFGENE_SAMPLE_SEARCH_AMR_POINT_MUTATIONS_QUINOLONES ==== -->
<!-- ====== REFGENE_SAMPLE_SEARCH_XXXXXXXXX =========== -->
<!-- span id="________"><b>_____TEMPLATE______</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#refgene-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style='padding-left: 2em'>
As an example:<br />
<ul>
<li>Open the NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>.</li>
<li><a href="_______">_______</a></li>
<li><a href="_______">_______</a></li>
<li><a href="_______">_______</a></li>
<li><a href="_______">_______</a></li>
</ul>
<i>A separate section of this file provides details about how to search specific <a href="#refgene-data-fields">data fields</a>, such as the <a href="#refgene-data-field-gene-family">gene_family</a> fields.<br />
The "<a href="#refgene-filters">Filters</a>" option provides an alternative method to select the alleles and/or gene families of interest.</i><br /><br />
<i>An alternative method for retrieving those genes and allele is to search the subclass data field directly. To do this, open the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> and enter the query:<br /> <b>________:_______</b><br />
A separate section of this file provides details about how to search specific <a href="#refgene-data-fields">data fields</a>, such as the <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> fields, and <a href="#case-sensitive">case sensitive</a> searches.</i><br /><br />
</div -->
<!-- ====== END_REFGENE_SAMPLE_SEARCH_XXXXXXXXX ======== -->
</div>
<!-- ====== END_REFGENE_USE_CASES ========= -->
<!-- ========= REFGENE_XXXXXXXX ============ -->
<!-- div style='padding-left: 2em'>
<h4 id="refgene-_________">_______TEMPLATE________ <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#reference-gene-catalog"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Pathogen Detection Reference Gene Catalog help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style='padding-left: 2em'>
<span id="________"><b>___________</b></span><br /><br />
The NCBI <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a> is a ___________.<br /><br />
Text text text text text text text text text text text text text text text text text text text text text text text text text text <a href="#_______">_______</a>.<br /><br />
<i>A separate section of this file provides <a href="#isolates-browser">Isolates Browser help documentation</a>, with details on how the browser can be used, including allowable <a href="#isolates-browser-input">input</a>, a description of the <a href="#isolates-browser-output">output</a>, and an <a href="#isolates-browser-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>.</i><br />
</div>
</div -->
<!-- ====== END_REFGENE_XXXXXXXX ========= -->
<!-- =========== END_REFERENCE_GENE_CATALOG ============ -->
<!-- =========== AMR_FINDER ============ -->
<h3 id="amr-finder">AMRFinderPlus <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<!-- ======= MINI-TOC ========= -->
<a href="#amr-finder-what-is">What is AMRFinderPlus?</a> | <a href="#amr-finder-install">Install software</a> | <a href="#amr-finder-data-files">Download data files</a>: <a href="#amr-finder-reference-gene-catalog">Reference Gene Catalog data</a>, <a href="#amr-finder-hmms">Hidden Markov Models (HMMs)</a>, <a href="#amr-finder-hierarchy">AMRFinder Hierarchy</a> (<a href="#amr-finder-hierarchy-illustration"><span style="color:#d70000">illustrated example</span> of a hierarchy</a>) | <a href="#amr-finder-results">Interpret AMRFinderPlus results</a> | <a href="#amr-finder-read-more">Read more</a> | <a href="#amr-finder-publication">Publication/citation</a><br /><br />
<!-- ======= END_MINI-TOC ========= -->
<span id="amr-finder-what-is"><b>What is AMRFinderPlus?</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> - Identifies antimicrobial resistance (AMR) genes and point mutations in assembled nucleotide and protein sequences. AMRFinderPlus also identifies select virulence and stress resistance genes. AMRFinderPlus compares isolate genomes against the reference protein set using BLAST and against the HMM set using HMMER, and uses the gene hierarchy to provide the most specific protein assignment to antimicrobial resistant protein or family, if present in the query set of proteins. The <a href="https://github.com/ncbi/amr/wiki/v1-Home">original AMRFinder</a> identifies acquired antimicrobial resistance (AMR) genes, as well as point mutations that confer antimicrobial resistance, in either protein datasets or nucleotide data, including genomic data. <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus</a> identifies the AMR genes and point mutations that are found by the original AMRFinder, plus it identifies select members of additional classes of genes such as virulence factors, biocide, heat, acid, and metal resistance genes. Unlike other AMR gene detection methods that report the best hit, AMRFinderPlus reports the specific gene symbol based on the available evidence. For example, when presented with a novel blaKPC allele that is nearly identical to blaKPC-2, closest hit tools might return blaKPC-2, but AMRFinderPlus would call it as blaKPC (<a href="#amr-finder-hierarchy-illustration">illustrated example</a>). More details about the tool are provided in a publication by <a href="https://pubmed.ncbi.nlm.nih.gov/34135355/">Feldgarden M, et al., 2021</a>.
<ul>
<li id="amr-finder-install"><b>Install AMRFinderPlus</b> from: <a href="https://github.com/ncbi/amr/wiki">https://github.com/ncbi/amr/wiki</a> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></li>
<li id="amr-finder-data-files"><b>Download data files</b>: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
The AMRFinderPlus software uses the following data sets, which can be downloaded from the links below:
<ol>
<li id="amr-finder-reference-gene-catalog"><b>Pathogen Detection Reference Gene Catalog</b>:
<ul>
<li>The collection of curated genes used in AMRFinderPlus, which includes two subsets of genes/alleles: (1) "Core:" highly curated, AMR-specific genes; (2) "Plus:" biocide and stress resistance, general efflux, virulence, or antigenicity genes.</li>
<li><a href="#reference-gene-catalog">Read more about the Reference Gene Catalog</a></li>
<li> <a href="/pathogens/isolates#/refgene/">browse/search the Reference Gene Catalog</a></li>
<li>Download: <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/ReferenceGeneCatalog.txt">https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database</a></li>
</ul>
</li>
<li id="amr-finder-hmms"><b>Pathogen Detection HMM Catalog (Hidden Markov Models)</b>:
<ul>
<li>A library of Hidden Markov Models (HMMs) that was created, calibrated, and annotated at NCBI, in order to create a hierarchical classification system for AMR proteins, with fine divisions of both recognized families and additional groups to sensitively and accurately identify AMR gene sequences.</li>
<li><a href="/pathogens/docs/HMM_catalog">Read more about the Reference HMM Catalog</a></li>
<li><a href="/pathogens/docs/HMM_catalog/">browse/search the Reference HMM Catalog</a></li>
<li>Download: <a href="https://ftp.ncbi.nlm.nih.gov/hmm/NCBIfam-AMRFinder/">https://ftp.ncbi.nlm.nih.gov/hmm/NCBIfam-AMRFinder/</a></li>
</ul>
</li>
<li id="amr-finder-hierarchy"><b>Reference Gene Hierarchy</b>:
<ul>
<li>A hierarchical framework of gene families, symbols, and names to provide the most specific protein assignment to antimicrobial resistant protein or family. Both the reference proteins and the HMMs are placed into this hierarchy. Unlike other AMR gene detection methods that report the best hit, AMRFinderPlus reports the specific gene symbol based on the available evidence. For example, when presented with a novel blaKPC allele that is nearly identical to blaKPC-2, closest hit tools might return blaKPC-2, but AMRFinder would not incorrectly call it the blaKPC-2 allele (<a href="#amr-finder-hierarchy-illustration">illustrated example</a>).</li>
<li><a href="/pathogens/docs/gene_hierarchy">Read more about the Reference Gene Hierarchy</a></li>
<li><a href="/pathogens/genehierarchy">Browse/search the Reference Gene Hierarchy</a></li>
<li>Download: <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/ReferenceGeneHierarchy.txt">Reference Gene Hierarchy in tab-delimited format</a>
<br /><br />
<span id="amr-finder-hierarchy-illustration">
<img src="/core/assets/pathogens/images/AMR_hierarchy_example_blaKPC2.png" width="700" height="475" border="0" alt="Illustrated example of AMRFinderPlus hierarchical classification system for antimicrobial resistance proteins, featuring the hierarchy for blaKPC-2." /></span><br />
</li>
</ul>
</li>
</ol>
</li>
<li id="amr-finder-results"><b>Interpret AMRFinderPlus results</b>: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<ul>
<li>See the AMRFinderPlus documentation on GitHub for details about interpreting AMRFinderPlus results: <a href="https://github.com/ncbi/amr/wiki/Interpreting-results">https://github.com/ncbi/amr/wiki/Interpreting-results</a></li>
</ul>
</li>
<li id="amr-finder-read-more"><b>Read more about AMRFinderPlus</b>: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<ul>
<li><b>Overview</b>: <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a></li>
<li><b>AMRFinder</b> (original version) identifies acquired <i>antimicrobial resistance (AMR) genes</i>, as well as <i>point mutations</i> that confer antimicrobial resistance, in either protein datasets or nucleotide data, including genomic data. Additional details are provided in the <a href="https://github.com/ncbi/amr/wiki/v1-Home">documentation for AMRFinder</a> in <b>GitHub</b> (https://github.com/ncbi/amr/wiki/v1-Home).</li>
<li><b>AMRFinderPlus</b> identifies the <i>AMR genes</i> and <i>point mutations</i> that are found by the original AMRFinder, <i>plus</i> it identifies select members of additional classes of genes such as <i>virulence factors, biocide, heat, acid, and metal resistance genes</i>. Additional details are provided in the <a href="https://github.com/ncbi/amr/wiki">documentation for AMRFinderPlus</a> in <b>GitHub</b> (https://github.com/ncbi/amr/wiki).</li>
</ul>
</li>
<li id="amr-finder-publication"><b>Publication/Citation</b>: <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr-finder"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="AMRFinderPlus, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<ul>
<li>See <a href="#amrfinder_citations">AMRFinderPlus references</a></li>
</ul>
</li>
<!-- li>Publication: <a href="https://doi.org/10.1128/AAC.00483-19">Feldgarden et al. (2019), https://doi.org/10.1128/AAC.00483-19</a>, <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">PubMed PMID: 31427293</a>.
[bioRxiv: <a href="https://doi.org/10.1101/550707">Feldgarden et al. (2019), https://doi.org/10.1101/550707</a>]</li -->
</ul>
</div>
<!-- =========== END_AMR_FINDER ============ -->
<!-- =========== MicroBIGG-E ============ -->
<h3 id="microbigge">MicroBIGG-E (<b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements) <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<!-- ======= MINI-TOC ========= -->
<ul>
<li><a href="#microbigge-what-is">What is MicroBIGG-E?</a>
<ul>
<li><a href="#microbigge-acronym">MicroBIGG-E acronym</a></li>
<li><a href="#microbigge-and-isolates-browser-relationship">Relationship between MicroBIGG-E and Pathogens Isolates Browser</a></li>
</ul>
</li>
<li><a href="#microbigge-access">Where to access MicroBIGG-E?</a>
<ul>
<li><a href="#microbigge-access-browse">Browse/Search MicroBIGG-E</a></li>
<li><a href="#microbigge-access-download">Download the MicroBIGG-E data</a></li>
<li><img src="https://www.ncbi.nlm.nih.gov/pathogens/static/main/app/images/new.png" alt="New" /> <a href="/pathogens/docs/microbigge_gcp">MicroBIGG-E at Google Cloud</a></li>
</ul>
</li>
<li><a href="#microbigge-search-tips">Search tips</a>
<ul>
<li><a href="#microbigge-allowable-search-terms">Allowable search terms</a></li>
<li><a href="#microbigge-basic-search">Basic search</a></li>
<li><a href="#microbigge-advanced-search">Advanced search</a></li>
<li><a href="#microbigge-filters">Filters</a></li>
</ul>
</li>
<li><a href="#microbigge-data-fields">Data fields</a> include:
<ul>
<li><a href="#microbigge-data-field-group-isolate">Isolate data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-scientific-name">Scientific name (<b><i>scientific_name</i></b>)</a></li>
<li><a href="#microbigge-data-field-isolate">Isolate (<b><i>target_acc</i></b>)</a></li>
<li><a href="#microbigge-data-field-isolation-type">Isolation type (<b><i>epi_type</i></b>)</a></li>
</ul>
</li>
<li><a href="#microbigge-data-field-group-element">Element data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-element-symbol">Element symbol (<b><i>element_symbol</i></b>)</a></li>
<li><a href="#microbigge-data-field-element-name">Element name (<b><i>element_name</i></b>)</a></li>
<li><a href="#microbigge-data-field-protein">Protein (<b><i>protein_acc</i></b>)</a></li>
<li><a href="#microbigge-data-field-contig">Contig (<b><i>contig_acc</i></b>)</a></li>
<li><a href="#microbigge-data-field-start">Start (<b><i>start_on_contig</i></b>)</a></li>
<li><a href="#microbigge-data-field-stop">Stop (<b><i>end_on_contig</i></b>)</a></li>
</ul>
</li>
<li><a href="#microbigge-data-field-group-reference">Reference data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-closest-reference-accession">Closest reference accession (<b><i>closest_reference_acc</i></b>)</a></li>
<li><a href="#microbigge-data-field-closest-reference-name">Closest reference name (<b><i>closest_reference_name</i></b>)</a></li>
<li><a href="#microbigge-data-field-hmm-acc">HMM Accession (<b><i>hmm_acc</i></b>)</a></li>
</ul>
</li>
<li><a href="#microbigge-data-field-group-analysis-results">Analysis results (Element vs Reference) data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-alignment-length">Alignment length (<b><i>align_length</i></b>)</a></li>
<li><a href="#microbigge-data-field-identity">% Identity
(<b><i>pct_ref_identity</i></b>)</a></li>
<li><a href="#microbigge-data-field-coverage">% Coverage (<b><i>pct_ref_coverage</i></b>)</a></li>
</ul>
</li>
<li><a href="#microbigge-data-field-group-analysis-log">Analysis log data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-analysis-type">AMRFinderPlus analysis type (<b><i>amrfinderplus_analysis_type</i></b>)</a></li>
<li><a href="#microbigge-data-field-amrfinderplus-version">AMRFinderPlus version (<b><i>amrfinderplus_version</i></b>)</a></li>
<li><a href="#microbigge-data-field-refgene-db-version">PD Ref Gene Catalog Version (<b><i>refgene_db_version</i></b>)</a></li>
</ul>
</li>
<!-- li><a href="#microbigge-data-field-group-________">________ data fields</a>, such as:
<ul>
<li><a href="#microbigge-data-field-________">________</a></li>
<li><a href="#microbigge-data-field-________">________</a></li>
<li><a href="#microbigge-data-field-________">________</a></li>
</ul>
</li -->
<li><a href="#microbigge-data-fields-list">see a list of all MicroBIGG-E data fields</a></li>
</ul>
</li>
<li><a href="#microbigge-output">Output</a>
<ul>
<li><a href="#microbigge-output-table">Tabular list of genes</a></li>
<li><a href="#microbigge-filters">Filters to refine results</a></li>
<!-- li><a href="#microbigge-sort-order">Sort order</a></li -->
<li><a href="#microbigge-display-options">Customize the MicroBIGG-E display</a></li>
<li><a href="#microbigge-cross-browser-selection">Cross-browser selection</a></li>
</ul>
</li>
<li><a href="#microbigge-sample-searches"><span style="color:#d70000">Use cases/sample searches</span> of MicroBIGG-E</a>
<ul>
<li><a href="#microbigge-sample-search-genes-co-occur-on-contig">Identify isolates that have same set of genes and determine if they co-occur on the same contig</a></li>
<li><a href="#microbigge-sample-search-partial-gene-in-middle-of-contig">Identify partial gene sequences in the middle of contigs</a></li>
<li><a href="#microbigge-sample-search-find-alleles-described-by-publication">Find the isolates and alleles described by a publication of interest</a></li>
<li><a href="#microbigge-sample-search-isolates-with-co-occurring-genes">Display isolates in isolates browser that have the same set of genes co-occurring on the same contig</a></li>
<li><a href="#microbigge-sample-search-hits-from-isolates-with-co-occurring-genes">Display hits from isolates with co-occurring genes</a></li>
</ul>
</li>
</ul>
<!-- ======= END_MINI-TOC ========= -->
<!-- =========== MicroBIGG-E_WHAT_IS ============ -->
<h4 id="microbigge-what-is">What is MicroBIGG-E? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<span id="microbigge-acronym">"<a href="/pathogens/isolates#/microbigge/"><b>MicroBIGG-E</b></a>" is the <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<ul>
<li>MicroBIGG-E contains genetic and genomic elements identified in assemblies analyzed by <a href="https://www.ncbi.nlm.nih.gov/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> as part of the Pathogen Detection Pipeline. See the <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus wiki</a> for more information on how AMRFinderPlus works and the <a href="#refgene-what-is">Pathogen Detection Reference Gene Catalog</a> for a list of the elements that AMRFinderPlus is searching for.</li>
<li>MicroBIGG-E will be updated each time an <a href="#isolates-browser-data-field-OrganismGroup">organism group</a> is updated in the Isolates Browser.</li>
<li>It contains the <b>genetic and genomic elements</b> that have been found in isolate genomes that have been <b>published in GenBank</b>. <i>(This is in contrast to the Isolates Browser, which contains isolates that have been published in GenBank as well as those awaiting submission to GenBank.)</i> The output is the results of <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> analyses, as described in the <a href="/pathogens/docs/data_processing">data processing pipeline</a> section of this document.</li>
<li>The MicroBIGG-E will initially include <b>genes</b>, <b>alleles</b>, and <b>point mutations</b>.</li>
<li><b>Every row</b> in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> display is an <b>anti-microbial resistance (AMR)</b>, <b>stress response</b>, and/or <b>virulence</b> gene that has been identified in an isolate assembly by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, with information about the method used to identify it, supporting evidence, and the element's type, subtype, class, subclass, and more.</li>
<li>The <b>purpose of MicroBIGG-E</b> is to enable researchers to obtain detailed information about the element as well as the actual contigs that contain a genetic or genomic element of interest, in order to conduct further analysis.</li>
<li>The Pathogen Detection pipeline uses two assemblers, a <i>de novo</i> assembler and a targeted assembler (SAUTE) to increase assembly sensitivity and accuracy for AMR genes. A region of the genome may therefore appear in two contigs, so it looks like there are duplicated genes. For this reason the copy number for AMR genes in MicroBIGG-E will often be higher than appears in the actual isolate.</li>
</ul>
<!-- ==== RELATIONSHIP_BETWEEN_MicroBIGG-E_AND_ISOLATES_BROWSER ==== -->
<span id="microbigge-and-isolates-browser-relationship"><b>Relationship between MicroBIGG-E and Pathogens Isolates Browser</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
<ul>
<li><a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a><!-- , the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>, --> and the <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> are <b>related</b> resources and are <b>integrated</b> with each other.</li>
<li>The main <b>similarities</b> between the resources are their <b>shared search engine</b> and <b>similar search techniques</b>:
<ul>
<li>Both use the <a href="#solr">SOLR query language</a> and allow searches by a wide variety of text terms.</li>
<li>The search tips provided in the <a href="#isolates-browser">Isolates Browser help documentation</a> therefore also apply<!-- to the Reference Gene Catalog and --> to MicroBIGG-E, such as <a href="#isolates-browser-basic-search">basic search</a> techniques, <a href="#isolates-browser-advanced-search">advanced search</a> techniques, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive versus case insensitive searches</a>, and the availability of "filters" to refine search results.</li>
</ul>
</li>
<li>The main <b>differences</b> between the resources are the <b>scope</b> of data being searched, the set of <b>data fields</b> (and <b>filters</b>, which are based on data fields) that are available for searching, and the <b>columns</b> that are shown in the display of search results: <i>(The <a href="#microbigge-data-fields">MicroBIGG-E data fields</a> are described below, and the <a href="#refgene-data-fields">Reference Gene Catalog data fields</a> and <a href="#isolates-browser-data-fields">Pathogens Isolates Browser data fields</a> are described in the help for each of those resources.)</i>
<ul>
<li>The <a href="/pathogens/isolates#/search/"><b>Pathogens Isolates Browser</b></a> searches all <b>isolate genomes</b> in the Pathogen Detection project <b>which have been deposited in GenBank</b>, as well as corresponding <b>metadata</b> that are described under <a href="#data-types">types of data</a>.
<ul>
<li><b>Every row</b> in the Isolates Browser is an <b>assembled isolate</b>, possibly with antimicrobial resistance (AMR), virulence, and/or stress response <a href="#data-type-genotype">genotype data</a>, and antibiotic susceptibility (AST) <a href="#data-type-phenotype">phenotype data</a>, as available.</li>
<li>The <a href="#isolates-browser">Isolates Browser help documentation</a> describes the <a href="#isolates-browser-data-fields">available data fields</a> and <a href="#isolates-browser-output">output</a>.</li>
</ul>
</li>
<!-- li>The <a href="/pathogens/isolates#/refgene/"><b>Pathogen Detection Reference Gene Catalog</b></a> is a <a href="#refgene-non-redundant">non-redundant</a> database of bacterial genes related to antimicrobial resistance, biocide and stress resistance, general efflux, virulence, or antigenicity.
<ul>
<li><b>Every row</b> in the Pathogen Detection Reference Gene Catalog display is a <b>reference gene</b> or a <b>point mutation</b>.</li>
<li>The <a href="#reference-gene-catalog">Reference Gene Catalog help</a> describes the <a href="#refgene-scope">scope of data</a>, <a href="#refgene-data-fields">available <b>data fields</b></a>, and <a href="#refgene-output">output</a>.</li>
</ul>
</li -->
<li>The <a href="/pathogens/isolates#/microbigge/"><b>MicroBIGG-E</b></a> searches the collection of <b>genetic and genomic elements</b>, such as genes related to antimicrobial resistance, stress resistance, and virulence, that have been identified in the isolates through the <a href="/pathogens/docs/data_processing">data processing pipeline</a>.
<ul>
<li><b>Every row</b> in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> display is an <b>anti-microbial resistance (AMR)</b>, <b>stress response</b>, and/or <b>virulence</b> gene that has been identified in an isolate by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, with information about the method used to identify it, supporting evidence, and the element's type, subtype, class, subclass.</li>
<li>The <a href="#microbigge-data-fields">MicroBIGG-E data fields</a> are described below, and are reflected in the columns displayed in the <a href="#microbigge-output">MicroBIGG-E output</a>.</li>
</ul>
</li>
</ul>
</li>
<li>The <a href="/pathogens/isolates#/search/">Pathogens Isolates Browser</a> and <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> are linked using <a href="#microbigge-cross-browser-selection">Cross-browser selection</a>.<!-- For example: -->
<!-- ul>
<li>The <a href="#isolates-browser-data-field-AMRGenotypes">AMR genotypes</a>, <a href="#isolates-browser-data-field-stress-genotypes">Stress genotypes</a>, and <a href="#isolates-browser-data-field-virulence-genotypes">Virulence genotypes</a> columns in the Isolates Browser link to the corresponding gene/allele record(s) in MicroBIGG-E.</li>
<li>The <a href="#microbigge-data-field-________">________</a> column in MicroBIGG-E links to the Isolates Browser. Clicking on a ________ in that column will open the Isolates Browser and will display the isolates that have been found, by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>, to contain the gene of interest.</li>
</ul -->
</li>
</ul>
<!-- === END_RELATIONSHIP_BETWEEN_MicroBIGG-E_AND_ISOLATES_BROWSER === -->
</div>
<!-- =========== END_MicroBIGG-E_WHAT_IS ============ -->
<!-- =========== MicroBIGG-E_ACCESS ============ -->
<h4 id="microbigge-access">Where to access MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
"<a href="/pathogens/isolates#/microbigge/"><b>MicroBIGG-E</b></a>," the <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements, is accessible from the
<a href="/pathogens">Pathogen Detection Project home page</a> (as a link in the right hand margin under "Data Resources"), from the
<a href="/pathogens/antimicrobial-resistance/">AMR landing page</a> (National Database of Antibiotic Resistant Organisms (NDARO)), and from the <a href="/pathogens/antimicrobial-resistance/resources/">AMR Resources page</a>. The raw data behind it is available at <a href="/pathogens/docs/microbigge_gcp">Google Cloud</a>.<br /><br />
You can also access MicroBIGG-E directly from the links below:
<br /><br />
<span id="microbigge-access-browse"><b>Browse/Search</b> MicroBIGG-E:</span><br />
<a href="/pathogens/isolates#/microbigge/">/pathogens/isolates#/microbigge/</a>.<br /><br />
<span id="microbigge-access-download"><b>Download</b> the MicroBIGG-E data:</span><br />
Click the "Download" button in the header of the MicroBIGG-E table to download data.
You can download either a tab-delimited or CSV-formatted representation of the table view, or a set of sequences under the "Dataset" selection.
<ul>
<li><b>Table</b> downloads can be in either Tab-delimited (.tsv) format or Excel comma-delimited format (.csv), and have a maximum of 100,000 rows.</li>
<li><b>Dataset</b> downloads contain protein or nucleotide data related to the elements shown in the table. These can be the DNA sequence of the elements, the elements plus flanks (up to 2,000 bp), the entire contig containing the elements (max 1,000 contigs), or the amino-acid sequences of the protein elements.</li>
<li><img src="/pathogens/static/main/app/images/new.png" alt="New" /> <b>GCP BigQuery</b>: Full table access using SQL. See <a href="/pathogens/docs/microbigge_gcp">MicroBIGG-E data at Google Cloud Platform</a> for more information on how to get full MicroBIGG-E data on Google Cloud in BigQuery. </li>
</ul>
Bulk access for MicroBIGG-E data is under active development. Table data is now <a href="/pathogens/docs/microbigge_gcp">available on GCP</a>. Email NCBI at <a href="mailto:pd-help@ncbi.nlm.nih.gov">pd-help@ncbi.nlm.nih.gov</a> if the current functionality does not meet your needs.<br /><br />
</div>
<!-- =========== END_MicroBIGG-E_ACCESS ============ -->
<!-- =========== MicroBIGG-E_SEARCH_TIPS ============ -->
<h4 id="microbigge-search-tips">Search tips for MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<span id="microbigge-allowable-search-terms"><b>Allowable search terms</b> (MicroBIGG-E)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li><a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> can be searched by the terms that appear in any of the <a href="#microbigge-data-fields"><b>data fields</b></a> described below. A search example is provided after each data field description, when possible.</li>
</ul>
<span id="microbigge-basic-search"><b>Basic search</b> (MicroBIGG-E)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#isolates-browser-basic-search">basic search</a> section also apply to MicroBIGG-E, such as searches for <a href="#query-tips-multiple-terms">multiple terms</a>, <a href="#query-tips-special-characters">special characters</a>, <a href="#query-tips-phrase-search-quotes">phrase searches</a>, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a>, etc.</li>
</ul>
<span id="microbigge-advanced-search"><b>Advanced search</b> (MicroBIGG-E)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> &gt; <a href="#isolates-browser-advanced-search">advanced search</a> section also apply to MicroBIGG-E, because both resources use the <a href="#solr">SOLR query language</a>.</li>
<li>The main difference is the data fields that are available to be searched, because each resource has its own set of data fields. <i>(The data fields in MicroBIGG-E are the same as the <a href="#refgene-data-fields-list">data fields in the Pathogen Detection Reference Gene Catalog</a>, which are different from the <a href="#isolates-browser-data-fields-list">data fields in the Isolates Browser</a>.)</i></li>
<li>The query tips described in the <a href="#isolates-browser">Isolates Browser help</a> also apply to MicroBIGG-E, such as searches for <a href="#query-tips-multiple-terms">multiple terms</a>, <a href="#query-tips-special-characters">special characters</a>, <a href="#query-tips-phrase-search-quotes">phrase searches</a>, <a href="#query-tips-case-sensitive-vs-case-insensitive">case sensitive vs. case insensitive searches</a>, etc.</li>
</ul>
<span id="microbigge-filters"><b>Filters</b> (MicroBIGG-E)</span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The "Filters" menu options in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a basic search or an advanced search.</li>
<li>Each filter displays counts of elements next to each term in the filter. Note that these counts are for elements in the browser, and may not accurately describe the number of genes in actual isolates because Pathogen Detection assemblies use both <i>de novo</i> and guided assemblies which may represent the same gene in an assembly multiple times. </li>
<li>By default, each filter displays the <b>top 100 terms</b> (based on the number of isolates retrieved by a term) listed by count of value within that set of top 100. Use the search box to search for terms not in the top 100. Note that:
<ul>
<li>A <b>Boolean "OR"</b> is applied if multiple items are checked in the same filter field. This way you can choose multiple values in the same filter. For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>, then check the boxes for "Stress" and for "Virulence" in the "Type" filter. The system will retrieve genetic/genomic elements that are associated with either stress resistance or with virulence.</li>
</ul>
</li>
<li>A <b>Boolean "AND"</b> is applied if you select items in several different filter fields (Type, Class, etc). For example:
<ul>
<li>Open the "Filters" tab of the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> web interface, then check the boxes for "Point" in the "Subtype" filter and "Quinolone" in the "Class" filter. The system will retrieve genetic/genomic elements that meet both of your specified criteria (in this case, point mutations that confer resistance to quinolones).</li>
</ul>
</li>
<!-- li>If you prefer to apply a <b>Boolean "AND"</b> to multiple items within the same filter field, you can enter a <b>SOLR query</b>. For example:
<ul>
<li>To retrieve alleles that have [that meet all of the checked criteria, rather than one or more of them] <b>both</b> ____ AND ____, open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> and enter a SOLR query such as:
<a href="______">datafieldXXname:"value" AND datafieldXXname:"value"</a>.<br />
<i>(A separate section of this document provides additional information about the <a href="#solr">SOLR query language</a>. Additionally, note that only a subset of the available data fields are shown in the default output of <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>; use the <b>choose columns</b> to add additional columns to the display.)</i></li>
</ul>
</li -->
</ul>
</li>
<li>As explained in the <a href="#isolates-browser">Isolates Browser help</a>, <a href="#filters-on-the-fly">Filters are generated on the fly</a>. As a result, the terms that are listed under each filter will depend on the data set you are currently displaying in the browser. That is also true for the filters in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>.</li>
</ul>
</div>
<!-- =========== END_MicroBIGG-E_SEARCH_TIPS ============ -->
<!-- =========== MicroBIGG-E_DATA_FIELDS ============ -->
<h4 id="microbigge-data-fields">Data Fields in MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
The MicroBIGG-E <a href="#microbigge-data-fields-list">data fields listed below</a> have been indexed by the Pathogen Detection project and are therefore <b>directly searchable</b>, using the <a href="#isolates-browser-advanced-search">advanced search techniques</a> that are described in the <a href="#isolates-browser">Isolates Browser help</a>, because both MicroBIGG-E and the Isolates Browser use the <a href="#solr">SOLR query language</a>. Note that the <span style="background-color: #ffff00">data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a></span>, as described in the Isolates Browser help.<br /><br />
Each data field reflects an available column in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> web interface. The <a href="#microbigge-output">output</a> section of this document provides tips on how to <a href="#microbigge-display-options">customize the display</a>, using the "choose columns" function.<br /><br />
<b>Please note:</b> in the list of available data fields below: <br />
<ul>
<li>The term shown in the <span style="background-color: #ffff00">regular font</span> is the <span style="background-color: #ffff00">display name</span> (column header) shown by the MicroBIGG-E web interface. The term shown in <span style="background-color: #ffff00"><i>(italics)</i></span> is the <span style="background-color: #ffff00"><b><i>name of the corresponding data field</i></b>, if you want to search that field directly</span>.</li>
<li>For example, one data field is listed as: <a href="#microbigge-data-field-method">Method (<b><i>amr_method</i></b>)</a>. The term
"<b>Method</b>" appears in the MicroBIGG-E column header, and "<b><i>amr_method</i></b>" (with an underscore bar instead of a space) is the string you should use if you want to search that data field directly.</li>
<li>Brief <b><i>italicized search examples</i></b> are also provided for each data field, when possible, showing how to query the data field directly. The values represent text strings <b>exactly as they appear in the data fields</b>, including upper case and lower case letters, <a href="#special-characters">special characters</a> such as hyphens, etc. The <span style="background-color: #ffff00">data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a></span>.</li>
</ul>
<span id="microbigge-data-fields-list"><b>The available data fields in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> include the following:</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
Note that each field is written in this format: &#160;&#160;<b>Display name</b> (<b><i>data_field_name</i></b>)<br />
The "Display name" is the column header that appears in the MicroBIGG-E web interface, and the "<i>data_field_name</i>" is the <a href="#case-sensitive">case-sensitive</a> string you should enter if you want to search the data field directly using a <a href="#solr">SOLR query</a>:<br />
<!-- ========== MicroBIGG-E_DATA_FIELDS_MINI_TOC =========== -->
<table width="100%">
<tr>
<td width="50%" valign="top">
<a href="#microbigge-data-field-group-isolate"><b>Isolate data fields:</b></a><br />
<div style="padding-left: 2em">
<a href="#microbigge-data-field-scientific-name">Scientific name (<b><i>scientific_name</i></b>)</a><br />
<a href="#microbigge-data-field-organism-group">Organism group (<b><i>taxgroup_name</i></b>)</a><br />
<a href="#microbigge-data-field-serovar">Serovar (<b><i>serovar</i></b>)</a><br />
<a href="#microbigge-data-field-strain">Strain (<b><i>strain</i></b>)</a><br />
<a href="#microbigge-data-field-isolate">Isolate (<b><i>target_acc</i></b>)</a><br />
<a href="#microbigge-data-field-isolation-source">Isolation source (<b><i>isolation_source</i></b>)</a><br />
<a href="#microbigge-data-field-isolation-type">Isolation type (<b><i>epi_type</i></b>)</a><br />
<a href="#microbigge-data-field-bioproject">BioProject (<b><i>bioproject_acc</i></b>)</a><br />
<a href="#microbigge-data-field-biosample">BioSample (<b><i>biosample_acc</i></b>)</a><br />
<a href="#microbigge-data-field-collection-date">Collection date (<b><i>collection_date</i></b>)</a><br />
<a href="#microbigge-data-field-createdate">Create date (<b><i>creation_date</i></b>)</a><br />
<a href="#microbigge-data-field-location">Location (<b><i>geo_loc_name</i></b>)</a><br />
<a href="#microbigge-data-field-host">Host (<b><i>host</i></b>)</a><br />
<a href="#microbigge-data-field-run">Run (<b><i>Run</i></b>)</a><br />
<a href="#microbigge-data-field-assembly">Assembly (<b><i>asm_acc</i></b>)</a><br />
</div>
<a href="#microbigge-data-field-group-element"><b>Element data fields:</b></a><br />
<div style="padding-left: 2em">
<a href="#microbigge-data-field-element-symbol">Element symbol (<b><i>element_symbol</i></b>)</a><!-- was Gene (<b><i>gene_symbol</i></b>) --><br />
<a href="#microbigge-data-field-element-name">Element name (<b><i>element_name</i></b>)</a><!-- was Gene (<b><i>gene_symbol</i></b>) --><br />
<a href="#microbigge-data-field-element-length">Element length (<b><i>element_length</i></b>)</a><br />
<a href="#microbigge-data-field-protein">Protein (<b><i>protein_acc</i></b>)</a><br />
<a href="#microbigge-data-field-contig">Contig (<b><i>contig_acc</i></b>)</a><br />
<a href="#microbigge-data-field-start">Start (<b><i>start_on_contig</i></b>)</a><br />
<a href="#microbigge-data-field-stop">Stop (<b><i>end_on_contig</i></b>)</a><br />
<a href="#microbigge-data-field-strand">Strand (<b><i>strand</i></b>)</a><br />
<a href="#microbigge-data-field-type">Type (<b><i>type</i></b>)</a><br />
<a href="#microbigge-data-field-subtype">Subtype (<b><i>subtype</i></b>)</a><br />
<a href="#microbigge-data-field-class">Class (<b><i>class</i></b>)</a><br />
<a href="#microbigge-data-field-subclass">Subclass (<b><i>subclass</i></b>)</a><br />
<a href="#microbigge-data-field-scope">Scope (<b><i>scope</i></b>)</a><br />
</div>
</td>
<td width="50%" valign="top">
<a href="#microbigge-data-field-group-reference"><b>Reference data fields:</b></a><br />
<div style="padding-left: 2em">
<a href="#microbigge-data-field-closest-reference-accession">Closest reference accession (<b><i>closest_reference_acc</i></b>)</a><br />
<a href="#microbigge-data-field-closest-reference-name">Closest reference name (<b><i>closest_reference_name</i></b>)</a><br />
<a href="#microbigge-data-field-reference-element-length">Reference element length (<b><i>reference_element_length</i></b>)</a><br />
<a href="#microbigge-data-field-hmm-acc">HMM Accession (<b><i>hmm_acc</i></b>)</a><br />
<a href="#microbigge-data-field-hmm-description">HMM Description (<b><i>hmm_description</i></b>)</a><br />
<a href="#microbigge-data-field-hierarchy-node">Hierarchy node (<b><i>hierarchy_node</i></b>)</a><br />
</div>
<a href="#microbigge-data-field-group-analysis-results"><b>Analysis results (Element vs Reference) data fields:</b></a><br />
<div style="padding-left: 2em">
<a href="#microbigge-data-field-method">Method (<b><i>amr_method</i></b>)</a><br />
<a href="#microbigge-data-field-alignment-length">Alignment length (<b><i>align_length</i></b>)</a><br />
<a href="#microbigge-data-field-identity">% Identity to reference
(<b><i>pct_ref_identity</i></b>)</a><br />
<a href="#microbigge-data-field-coverage">% Coverage of reference (<b><i>pct_ref_coverage</i></b>)</a><br />
<a href="#microbigge-data-field-contig-coverage">Contig coverage (<b><i>contig_coverage</i></b>)</a><br />
<a href="#microbigge-data-field-relative-assembly-coverage">Relative assembly coverage (<b><i>rel_asm_cov</i></b>)</a><br />
<a href="#microbigge-data-field-assembly-coverage">Assembly coverage (<b><i>asm_coverage</i></b>)</a><br />
</div>
<a href="#microbigge-data-field-group-analysis-log"><b>Analysis log data fields:</b></a><br />
<div style="padding-left: 2em">
<a href="#microbigge-data-field-analysis-type">AMRFinderPlus analysis type (<b><i>amrfinderplus_analysis_type</i></b>)</a><br />
<a href="#microbigge-data-field-amrfinderplus-version">AMRFinderPlus version (<b><i>amrfinderplus_version</i></b>)</a><br />
<a href="#microbigge-data-field-refgene-db-version">PD Ref Gene Catalog Version (<b><i>refgene_db_version</i></b>)</a><br />
</div>
<!-- a href="#microbigge-data-field-______">______ (<b><i>______</i></b>)</a><br / -->
</td>
</tr>
</table>
<br />
<!-- ========= END_MicroBIGG-E_DATA_FIELDS_MINI_TOC ========= -->
<!-- ========= MicroBIGG-E_DATA_FIELDS_DESCRIPTIONS =========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_GROUP_ISOLATE ========== -->
<span id="microbigge-data-field-group-isolate" style="background-color: #cde1ff"><b>Isolate data fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<!-- ======== MicroBIGG-E_DATA_FIELD_Scientific_name ========== -->
<li id="microbigge-data-field-scientific-name">
<span style="background-color: #cde1ff">Scientific name (<b><i>scientific_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-ScientificName">description of Scientific name</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_scientific_name ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Organism_group ========== -->
<li id="microbigge-data-field-organism-group">
<span style="background-color: #cde1ff">Organism group (<b><i>taxgroup_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-OrganismGroup">description of Organism group</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======= END_MicroBIGG-E_DATA_FIELD_Organism_group ======= -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Serovar ========== -->
<li id="microbigge-data-field-serovar">
<span style="background-color: #cde1ff">Serovar (<b><i>serovar</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Serovar">description of Serovar</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Serovar ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Strain ========== -->
<li id="microbigge-data-field-strain">
<span style="background-color: #cde1ff">Strain (<b><i>strain</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Strain">description of Strain</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Strain ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Isolate ========== -->
<li id="microbigge-data-field-isolate">
<span style="background-color: #cde1ff">Isolate (<b><i>target_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Isolate">description of Isolate</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Isolate ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Isolation_source ========== -->
<li id="microbigge-data-field-isolation-source">
<span style="background-color: #cde1ff">Isolation source (<b><i>isolation_source</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-IsolationSource">description of Isolation Source</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Isolation_source ======= -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Isolation_type ======= -->
<li id="microbigge-data-field-isolation-type">
<span style="background-color: #cde1ff">Isolation type (<b><i>epi_type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-IsolationType">description of Isolation type</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Isolation_type ======= -->
<!-- ======== MicroBIGG-E_DATA_FIELD_BioSample ========== -->
<li id="microbigge-data-field-biosample">
<span style="background-color: #cde1ff">BioSample (<b><i>biosample_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-BioSample">description of BioSample</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_BioSample ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_BioProject ========== -->
<li id="microbigge-data-field-bioproject">
<span style="background-color: #cde1ff">BioProject (<b><i>bioproject_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-BioProject">description of BioProject</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_BioProject ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Collection_date ========== -->
<li id="microbigge-data-field-collection-date">
<span style="background-color: #cde1ff">Collection date (<b><i>collection_date</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-CollectionDate">description of Collection Date</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Collection_date ======= -->
<!-- ====== MicroBIGG-E_DATA_FIELD_CreateDate ====== -->
<li id="microbigge-data-field-createdate">
<span style="background-color: #cde1ff">Create date (<b><i>creation_date</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-CreateDate">description of Create date</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== MicroBIGG-E_DATA_FIELD_Location ========== -->
<li id="microbigge-data-field-location">
<span style="background-color: #cde1ff">Location (<b><i>geo_loc_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Location">description of Location</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======= END_MicroBIGG-E_DATA_FIELD_Location ======== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Host ========== -->
<li id="microbigge-data-field-host">
<span style="background-color: #cde1ff">Host (<b><i>host</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Host">description of Host</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Host ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Run ========== -->
<li id="microbigge-data-field-run">
<span style="background-color: #cde1ff">Run (<b><i>Run</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Run">description of Run</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Run ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Assembly ========== -->
<li id="microbigge-data-field-assembly">
<span style="background-color: #cde1ff">Assembly (<b><i>asm_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-Assembly">description of Assembly</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Assembly ========== -->
</ul>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_GROUP_ISOLATE ======== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_GROUP_ELEMENT ========== -->
<span id="microbigge-data-field-group-element" style="background-color: #cde1ff"><b>Element data fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<!-- ======== MicroBIGG-E_DATA_FIELD_Element_symbol ========== -->
<li id="microbigge-data-field-element-symbol">
<span style="background-color: #cde1ff">Element symbol (<b><i>element_symbol</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The symbol assigned to the element by AMRFinderPlus.
Examples include an allele symbol (blaKPC-2), a protein symbol (blaKPC), or a point mutation symbol (gyrA_G81D). It can also be a very broad symbol representing a large family of proteins (bla) that you would not find in the reference gene catalog, but would find in the <a href="/pathogens/docs/gene_hierarchy/">Reference Gene Hierarchy</a>. This happens when AMRFinderPlus lacks evidence to use a more specific element symbol. After the inclusion of AMRFinderPlus 4.0.3 the Element symbol (<em>element_symbol</em>) field can also contain Stx operon calls made by <a href="https://github.com/ncbi/stxtyper">StxTyper</a> that look like <em>stx_operon</em> or <em>stx2a_operon</em>. <br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>element_symbol:searchterm</i></li>
<li>Search for: &#160; <i>element_symbol:blaKPC</i><br />
to show all genetic/genomic elements with that exact symbol.</li>
<li>Search for: &#160; <i>element_symbol:blaKPC OR element_symbol:blaKPC-2</i><br />
to show all genetic/genomic elements that have either of those exact symbols.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Element_symbol ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Element_name ========== -->
<li id="microbigge-data-field-element-name">
<span style="background-color: #cde1ff">Element name (<b><i>element_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The name of the element assigned by AMRFinderPlus. These can be names/descriptions of genes, point mutations, or stx operon calls from <a href="https://github.com/ncbi/stxtyper">StxTyper</a>. See the <a href="https://github.com/ncbi/stxtyper#--amrfinder-output">StxTyper documentation</a> for details.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Use <b><a href="#query-tips-phrase-search-quotes">quotes to search for phrases</a></b>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>element_name:searchterm</i></li>
<li>Search for: &#160; <i>element_name:"KPC family carbapenem-hydrolyzing class A beta-lactamase"</i><br />
to show genetic/genomic elements with that name.</li>
<li>Search for: &#160; <i>element_name:"KPC family carbapenem-hydrolyzing class A beta-lactamase" OR element_name:"carbapenem-hydrolyzing class A beta-lactamase KPC-2"</i><br />
to show all genetic/genomic elements that have either of those names.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Element_name ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Element_length ========== -->
<li id="microbigge-data-field-element-length">
<span style="background-color: #cde1ff">Element length (<b><i>element_length</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The length of this element in amino acids (AA) for protein elements, and in base pairs (bp) for nucleotide elements. For StxTyper output see the <a href="https://github.com/ncbi/stxtyper#--amrfinder-output">StxTyper documentation</a> for details.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>element_length:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>element_length:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>element_length:234</i><br />
to show genetic/genomic elements that have a length of 234 amino acids (or 234 nucleotides).</li>
<li>Search for: &#160; <i>element_length:[200 TO 250]</i><br />
to show genetic/genomic elements that range in length between 200 and 250 amino acids (or between 200 and 250 nucleotides).</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Element_length ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Protein ========== -->
<li id="microbigge-data-field-protein">
<span style="background-color: #cde1ff">Protein (<b><i>protein_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The accession of the protein sequence record for this element.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>protein_acc:searchterm</i></li>
<li>Search for: &#160; <i>protein_acc:WP_004199234.1</i><br />
to show genetic/genomic elements that have the protein sequence shown in the RefSeq record <a href="https://www.ncbi.nlm.nih.gov/protein/WP_004199234.1">WP_004199234.1</a>. This search retrieves many genetic/genomic elements from a large number of isolates, because the sequence has been found to be a multispecies protein.</li>
<li>Search for: &#160; <i>protein_acc:WP_124042569.1</i><br />
to show the genetic/genomic elements that have the protein sequence shown in the RefSeq record <a href="https://www.ncbi.nlm.nih.gov/protein/WP_124042569.1">WP_124042569.1</a>. As of May 23, 2020, this search retrieves a single element, from the E. coli isolate <a href="/pathogens/isolates#/search/PDT000411318.1">PDT000411318.1</a>.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Protein ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Contig ========== -->
<li id="microbigge-data-field-contig">
<span style="background-color: #cde1ff">Contig (<b><i>contig_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The accession of the contig sequence record on which this element appears.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>contig_acc:searchterm</i></li>
<li>Search for: &#160; <i>contig_acc:NZ_UWVC01000003.1</i><br />
to show the genetic/genomic elements that have been identified on the sequence of contig <a href="https://www.ncbi.nlm.nih.gov/nuccore/NZ_UWVC01000003.1">NZ_UWVC01000003.1</a>.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Contig ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Start ========== -->
<li id="microbigge-data-field-start">
<span style="background-color: #cde1ff">Start (<b><i>start_on_contig</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The start coordinate for the element on the contig sequence.<br />
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Start ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Stop ========== -->
<li id="microbigge-data-field-stop">
<span style="background-color: #cde1ff">Stop (<b><i>end_on_contig</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The stop coordinate for the element on the contig sequence.<br />
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Stop ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Strand ========== -->
<li id="microbigge-data-field-strand">
<span style="background-color: #cde1ff">Strand (<b><i>strand</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The strand (+/-) on which the genetic or genomic element appears, relative to the nucleotide sequence that appears in the contig accession listed for the element.
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Strand ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Type ========== -->
<li id="microbigge-data-field-type">
<span style="background-color: #cde1ff">Type (<b><i>type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Classification for the type of gene found, such as AMR, STRESS, or VIRULENCE.<br /><br />
A more detailed description of the type and subtype fields is available on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#element-type-and-subtype">AMRFinderPlus wiki</a>.<br /><br />
<i>This data field also appears in the Pathogen Detection Reference Gene Catalog; a <a href="#refgene-data-field-type">description of Type</a> and examples of queries for that field appear in the <a href="#refgene-data-fields-list">Reference Gene Catalog data fields</a> help section.</i><br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Type ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Subtype ========== -->
<li id="microbigge-data-field-subtype">
<span style="background-color: #cde1ff">Subtype (<b><i>subtype</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Classification for the subtype of gene found.
A more detailed description of the type and subtype fields is available on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#element-type-and-subtype">AMRFinderPlus wiki</a>.<br /><br />
<i>This data field also appears in the Pathogen Detection Reference Gene Catalog; a <a href="#refgene-data-field-subtype">description of Subtype</a> and examples of queries for that field appear in the <a href="#refgene-data-fields-list">Reference Gene Catalog data fields</a> help section.</i><br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Subtype ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Class ========== -->
<li id="microbigge-data-field-class">
<span style="background-color: #cde1ff">Class (<b><i>class</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Class of resistance for "core" genes (see <a href="#refgene-data-field-scope">scope</a>), and typing information for some virulence genes and <a href="https://github.com/ncbi/stxtyper#--amrfinder-output">Stx type</a> for <i>E. coli</i> and <i>Shigella</i>.<br /><br />
<i>This data field also appears in the Pathogen Detection Reference Gene Catalog; a <a href="#refgene-data-field-class">description of Class</a> and examples of queries for that field appear in the <a href="#refgene-data-fields-list">Reference Gene Catalog data fields</a> help section.</i><br /><br />
<i>(In general, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate.)</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Class ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Subclass ========== -->
<li id="microbigge-data-field-subclass">
<span style="background-color: #cde1ff">Subclass (<b><i>subclass</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Where it is known, "Subclass" provides a more specific definition of the particular antibiotics or classes that are affected by the gene or point mutation (e.g., that are resisted by the gene/allele). While most subclass designations are self-explanatory, a few others have particular meanings. Specifically, "CEPHALOSPORIN" is equivalent to the Lahey 2be definition; "CARBAPENEM" means the protein has carbapenemase activity, but it might or might not confer resistance to other beta-lactams; "QUATERNARY AMMONIUM" are quaternary ammonium compounds. In addition, stx subtypes (e.g., STX2E) and intimin subtypes (e.g., ALPHA) are defined for Shiga toxin proteins (class of STX1 or STX2, see <a href="https://github.com/ncbi/stxtyper">StxTyper</a> for more details) and intimins (class of INTIMIN) respectively. Where the phenotypic information is incomplete, contradictory, or unclear, the "Class" value is used for the "Subclass" value.<br /><br />
More information about the class and subclass fields can be found on the <a href="https://github.com/ncbi/amr/wiki/Interpreting-results#class-and-subclass">AMRFinderPlus wiki</a>.<br /><br />
<i>This data field also appears in the Pathogen Detection Reference Gene Catalog; a <a href="#refgene-data-field-subclass">description of Subclass</a> and examples of queries for that field appear in the <a href="#refgene-data-fields-list">Reference Gene Catalog data fields</a> help section.</i><br /><br />
<i>(In general for resistance genes, <a href="#refgene-data-field-type">type</a> and <a href="#refgene-data-field-subtype">subtype</a> refer to the category of gene or genetic element, while <a href="#refgene-data-field-class">class</a> and <a href="#refgene-data-field-subclass">subclass</a> refer to the substrate or antimicrobial.)</i>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Subclass ======== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Scope ========== -->
<li id="microbigge-data-field-scope">
<span style="background-color: #cde1ff">Scope (<b><i>scope</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogen Detection Reference Gene Catalog; a <a href="#refgene-data-field-scope">description of Scope</a> and examples of queries for that field appear in the <a href="#refgene-data-fields-list">Reference Gene Catalog data fields</a> help section.</i>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Scope ========== -->
</ul>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_GROUP_ELEMENT ======= -->
<!-- ======== MicroBIGG-E_DATA_FIELD_GROUP_REFERENCE ========== -->
<span id="microbigge-data-field-group-reference" style="background-color: #cde1ff"><b>Reference data fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<!-- === MicroBIGG-E_DATA_FIELD_Closest_reference_accession === -->
<li id="microbigge-data-field-closest-reference-accession">
<span style="background-color: #cde1ff">Closest reference accession (<b><i>closest_reference_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The accession of the closest reference sequence. Note that only one reference will be chosen if the blast hit is equidistant from multiple references (NA if HMM-only hit). For point mutations the reference is the sensitive "wild-type" allele, and the element symbol describes the specific mutation. Check the <a href="/pathogens/refgene/">Reference Gene Catalog</a> for more information on specific mutations or reference genes.<br /><br />
For <a href="https://github.com/ncbi/stxtyper">StxTyper</a> calls this field may be two comma-separated values indicating the accessions of the two subunits identified. These accessions may not match those identified for the individual genes by AMRFinderPlus due to differences in alignment characteristics and databases, and, due to an oversight, the accession may not appear in the Reference Gene Catalog even though the protein sequences will be there associated with a different accession. This will be corrected with the next database release.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>closest_reference_acc:searchterm</i></li>
<li>Search for: &#160; <i>closest_reference_acc:WP_001083725.1</i><br />
to show genetic/genomic elements whose protein sequence is most closely related to the sequence in RefSeq record <a href="https://www.ncbi.nlm.nih.gov/protein/WP_001083725.1">https://www.ncbi.nlm.nih.gov/protein/WP_001083725.1</a>.<br /><br />
Note that some elements retrieved by the search above will list that accession in both the <i>closest_reference_acc</i> and <i>protein_acc</i> columns, while other proteins will list it only in the <i>closest_reference_acc</i> column. You can retrieve either subset with the following searches:<br />
Search for: &#160; <i>closest_reference_acc:WP_001083725.1 AND protein_acc:WP_001083725.1</i><br />
Search for: &#160; <i>closest_reference_acc:WP_001083725.1 NOT protein_acc:WP_001083725.1</i><br />
</li>
</ul>
</li>
<!-- === END_MicroBIGG-E_DATA_FIELD_Closest_reference_accession === -->
<!-- ====== MicroBIGG-E_DATA_FIELD_Closest_reference_name ====== -->
<li id="microbigge-data-field-closest-reference-name">
<span style="background-color: #cde1ff">Closest reference name (<b><i>closest_reference_name</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The name of the closest reference sequence.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Use <b><a href="#query-tips-phrase-search-quotes">quotes to search for phrases</a></b>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>closest_reference_name:searchterm</i></li>
<li>Search for: &#160; <i>closest_reference_name:"trimethoprim-resistant dihydrofolate reductase DfrA12"</i><br />
to show genetic/genomic elements whose closest RefSeq protein sequence is named "trimethoprim-resistant dihydrofolate reductase DfrA12."</li>
</ul>
</li>
<!-- ===== END_MicroBIGG-E_DATA_FIELD_Closest_reference_name ==== -->
<!-- ==== MicroBIGG-E_DATA_FIELD_Reference_element_length ===== -->
<li id="microbigge-data-field-reference-element-length">
<span style="background-color: #cde1ff">Reference element length (<b><i>reference_element_length</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Length of the reference sequence in amino acids (AA) for protein elements, and in base pairs (bp) for nucleotide elements.<br /><br />
For Stx operons this is the combined amino-acid length of the identified subunits. See the <a href="https://github.com/ncbi/stxtyper/#--amrfinder-output">StxTyper output documentation</a> for more details.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>reference_element_length:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>reference_element_length:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>reference_element_length:284</i><br />
to show genetic/genomic elements whose reference elements have a length of 284 amino acids (or 284 nucleotides).</li>
<li>Search for: &#160; <i>reference_element_length:[200 TO 250]</i><br />
to show genetic/genomic elements whose reference elements range in length between 200 and 250 amino acids (or between 200 and 250 nucleotides).</li>
</ul>
</li>
<!-- ==== END_MicroBIGG-E_DATA_FIELD_Reference_element_length ==== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_HMM_Accession ========== -->
<li id="microbigge-data-field-hmm-acc">
<span style="background-color: #cde1ff">HMM Accession (<b><i>hmm_acc</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The accession of the Hidden Markov Model (HMM) that hits this element above cutoff (if any). Clicking the HMM accession will take you to the HMM page in the <a href="https://www.ncbi.nlm.nih.gov/protfam/">Protein Family Models</a> database. From that page you can download the HMM itself and get additional information including the curated cutoffs, the seed alignment, and RefSeq sequences identified by this HMM.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>hmm_acc:searchterm</i></li>
<li>Search for: &#160; <i>hmm_acc:NF000053.2</i><br />
to show genetic/genomic elements that have a match to the Hidden Markov Model with accession NF000053.2 (trimethoprim-resistant dihydrofolate reductase DfrA12).</li>
</ul>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_HMM_Accession ======= -->
<!-- ======= MicroBIGG-E_DATA_FIELD_HMM_Description ======== -->
<li id="microbigge-data-field-hmm-description">
<span style="background-color: #cde1ff">HMM Description (<b><i>hmm_description</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The name of the Hidden Markov Model (HMM) that hits this element (if any).<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Use <b><a href="#query-tips-phrase-search-quotes">quotes to search for phrases</a></b>, as shown in the example below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>hmm_description:searchterm</i></li>
<li>Search for: &#160; <i>hmm_description:"trimethoprim-resistant dihydrofolate reductase DfrA12"</i><br />
to show genetic/genomic elements that have a match to the Hidden Markov Model with the name "trimethoprim-resistant dihydrofolate reductase DfrA12."</li>
</ul>
</li>
<!-- ======= END_MicroBIGG-E_DATA_FIELD_HMM_Description ======= -->
<!-- ======= MicroBIGG-E_DATA_FIELD_hierarchy_node ======= -->
<li id="microbigge-data-field-hierarchy-node">
<span style="background-color: #cde1ff">Hierarchy node (<b><i>hierarchy_node</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The hierarchy node(s) that this element was identified as. The <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a> organizes the proteins and HMMs in the database into a hierarchy that is used for naming, including higher level nodes that do not have a specific family name (for example bla for an unknown family beta-lactamase). <b>Clicking on an entry in this field will take you to that node in the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>.</b> Multiple values are possible for this field for fusion genes where one node may be used for each of the functions separately since they have different functional names. Multiple values may also be included for stx operons identified with <a href="https://github.com/ncbi/stxtyper">StxTyper</a> where there is a separate protein node for each of the stxA and stxB subunits. For point mutations (subtype:POINT), clicking the entry will display a "No Matching Results" message in the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a> since point mutations lack nodes in the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>. Although node IDs may look like gene symbols (and, for convenience, are often the same as a gene symbol), they are internal database IDs used to identify a node at a place in the hierarchy, not gene symbols. Multiple hierarchy nodes may share the same gene symbol. See the <a href="/pathogens/docs/gene_hierarchy/#node-id-node_id">Documentation for the node_id column in the Reference Gene Hierarchy</a> for a more detailed explanation.<br /><br />
</li>
<!-- ======= END_MicroBIGG-E_DATA_FIELD_hierarchy_node ======= -->
</ul>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_GROUP_REFERENCE ======== -->
<!-- ====== MicroBIGG-E_DATA_FIELD_GROUP_ANALYSIS_RESULTS ======== -->
<span id="microbigge-data-field-group-analysis-results" style="background-color: #cde1ff"><b>Analysis results (Element vs Reference) data fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<!-- ======== MicroBIGG-E_DATA_FIELD_Method ========== -->
<li id="microbigge-data-field-method">
<span style="background-color: #cde1ff">Method (<b><i>amr_method</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The method used by AMRFinderPlus to identify this element. A separate section of this document provides a <a href="/pathogens/docs/data_processing/#genotype-categories">table that summarizes AMRFinderPlus methods</a> that are used by the tool to analyze pathogen isolate genome assemblies and identify genetic and genomic elements. The <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus Wiki</a> provides <a href="https://github.com/ncbi/amr/wiki/Methods">additional details about the methods</a> and the <a href="https://github.com/ncbi/stxtyper#output">StxTyper "operon" field documentation</a> contains more information about how this is defined for StxTyper results.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>amr_method:searchterm</i></li>
<li>Search for: &#160; <i>amr_method:HMM</i><br />
to show proteins that were found by HMM only, more distant to reference proteins than our BLAST cutoffs.</li>
<li>Search for: &#160; <i>amr_method:POINTN OR amr_method:POINTP OR amr_method:POINTX</i><br />
to show point mutations that were identified using nucleotide BLAST (BLASTN), protein BLAST (BLASTP), or translated BLAST (BLASTX).</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Method ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Alignment_length ========== -->
<li id="microbigge-data-field-alignment-length">
<span style="background-color: #cde1ff">Alignment length (<b><i>align_length</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The length of the alignment between the genetic/genomic element, which was identified by AMRFinderPlus in the isolate genome assembly, and the reference element. The length is measured in amino acids (AA) for protein elements, and in base pairs (bp) for nucleotide elements. For StxTyper results this is the total amino acid length of the translated BLAST subunit alignments. See the <a href="https://github.com/ncbi/stxtyper">StxTyper documentation</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>align_length:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>align_length:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>align_length:[200 TO 250]</i><br />
to show genetic/genomic elements whose alignment to the closest reference element ranges in length between 200 and 250 amino acids (or between 200 and 250 nucleotides).</li>
</ul>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Alignment_length ====== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Identity ========== -->
<li id="microbigge-data-field-identity">
<span style="background-color: #cde1ff">% Identity (<b><i>pct_ref_identity</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The percent of identical amino acids or base pairs within the aligned region of the genetic/genomic element (identified by AMRFinderPlus in the isolate genome assembly) and the reference element. For StxTyper results this is the combined amino-acid percent identity of the stx subunits. See the <a href="https://github.com/ncbi/stxtyper">StxTyper documentation</a> for more information.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>pct_ref_identity:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>pct_ref_identity:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>pct_ref_identity:100</i><br />
to show genetic/genomic elements that have a 100% identity to the reference element, within the aligned region.</li>
<li>Search for: &#160; <i>pct_ref_identity:[98 TO 100]</i><br />
to show genetic/genomic elements that have an identity that ranges from 98% to 100% to the reference element, within the aligned region.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Identity ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Coverage ========== -->
<li id="microbigge-data-field-coverage">
<span style="background-color: #cde1ff">% Coverage (<b><i>pct_ref_coverage</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
The proportion of the reference sequence covered by the alignment between the target element and the reference element.<br />
For example, a coverage of 90% means that the alignment between the target element and the reference element covers 90% of the reference sequence's length.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>pct_ref_coverage:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>pct_ref_coverage:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>pct_ref_coverage:100</i><br />
to show genetic/genomic elements whose alignment to the closest reference element covers 100% of the reference element's length.</li>
<li>Search for: &#160; <i>pct_ref_coverage:[50 TO 75]</i><br />
to show genetic/genomic elements whose alignment to the closest reference element covers 50% to 75% of the reference element's length.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Coverage ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Contig_coverage ========== -->
<li id="microbigge-data-field-contig-coverage">
<span style="background-color: #cde1ff">Contig coverage (<b><i>contig_coverage</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Contig coverage is the mean coverage of aligned reads for the contig containing this hit. This is a decimal (floating point) number &gt; 0, not a percentage.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Example:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>contig_coverage:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>contig_coverage:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>contig_coverage:[96 TO 106]</i><br />
to show genetic/genomic elements that have a contig coverage between 96 and 106.</li>
</ul>
</li>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_Contig_coverage ========== -->
<!-- ==== MicroBIGG-E_DATA_FIELD_Relative_assembly_coverage ==== -->
<li id="microbigge-data-field-relative-assembly-coverage">
<span style="background-color: #cde1ff">Relative assembly coverage (<b><i>rel_asm_cov</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
This is the mean coverage by aligned reads of the entire contig divided by the mean coverage by aligned reads of the entire assembly. Mathematically the value is contig_coverage / asm_coverage. This is a ratio, a decimal (floating point) number &gt; 0, not a percentage.
<!-- mouseover: Average coverage of reads aligned to the assembly for the contig divided by average coverage of reads aligned to the entire assembly --><br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Example:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>rel_asm_cov:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>rel_asm_cov:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>rel_asm_cov:[1.190 TO 1.202]</i><br />
to show genetic/genomic elements that have relative assembly coverage between 1.190 and 1.202.</li>
<li>Search for: &#160; <i>rel_asm_cov:[1.1 TO 1.2]</i><br />
to show genetic/genomic elements that have relative assembly coverage between 1.100 and 1.200.</li>
</ul>
</li>
<!-- ==== END_MicroBIGG-E_DATA_FIELD_Relative_assembly_coverage ==== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_Assembly_coverage ======= -->
<li id="microbigge-data-field-assembly-coverage">
<span style="background-color: #cde1ff">Assembly coverage (<b><i>asm_coverage</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
Assembly coverage is the mean coverage of aligned reads for the entire assembly. This is a decimal (floating point) number &gt; 0, not a percentage.<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below.<br />
This data field can be queried by a <a href="#range-searches">range search</a>, as shown in the example below.<br /><br />
<b>Example:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>asm_coverage:searchterm</i></li>
<li>To search for a <b>range of values</b>, enter a query such as: &#160;<i>asm_coverage:[value1 TO value2]</i></li>
<li>Search for: &#160; <i>asm_coverage:[98 TO 110]</i><br />
to show genetic/genomic elements that have assembly coverage between 98 and 110.</li>
</ul>
</li>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_Assembly_coverage ====== -->
</ul>
<!-- ====== END_MicroBIGG-E_DATA_FIELD_GROUP_ANALYSIS_RESULTS ====== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_GROUP_ANALYSIS_LOG ========== -->
<span id="microbigge-data-field-group-analysis-log" style="background-color: #cde1ff"><b>Analysis log data fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<ul>
<!-- ==== MicroBIGG-E_DATA_FIELD_AMRFinderPlus_analysis_type ==== -->
<li id="microbigge-data-field-analysis-type">
<span style="background-color: #cde1ff">AMRFinderPlus analysis type (<b><i>amrfinderplus_analysis_type</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-amrfinderplus-analysis-type">description of AMRFinderPlus analysis type</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- === END_MicroBIGG-E_DATA_FIELD_AMRFinderPlus_analysis_type === -->
<!-- ==== MicroBIGG-E_DATA_FIELD_AMRFinderPlus_version ==== -->
<li id="microbigge-data-field-amrfinderplus-version">
<span style="background-color: #cde1ff">AMRFinderPlus version (<b><i>amrfinderplus_version</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-amrfinderplus-version">description of AMRFinderPlus version</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- ==== END_MicroBIGG-E_DATA_FIELD_AMRFinderPlus_version ==== -->
<!-- ==== MicroBIGG-E_DATA_FIELD_PD_Ref_Gene_Catalog_Version ==== -->
<li id="microbigge-data-field-refgene-db-version">
<span style="background-color: #cde1ff">PD Ref Gene Catalog Version (<b><i>refgene_db_version</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<i>This data field also appears in the Pathogens Isolates Browser; a <a href="#isolates-browser-data-field-refgene-db-version">description of PD Ref Gene Catalog Version</a> and examples of queries for that field appear in the <a href="#isolates-browser-data-fields-list">Isolates Browser data fields</a> help section.</i>
</li>
<!-- === END_MicroBIGG-E_DATA_FIELD_PD_Ref_Gene_Catalog_Version === -->
</ul>
<!-- ======== END_MicroBIGG-E_DATA_FIELD_GROUP_ANALYSIS_LOG ======== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_GROUP_XXXXXXX ========== -->
<!-- span id="microbigge-data-field-group-________" style="background-color: #cde1ff"><b>______ fields:</b></span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br / -->
<!-- ul -->
<!-- ======== MicroBIGG-E_DATA_FIELD_XXXXXXXXXX ========== -->
<!-- li id="microbigge-data-field-________">
<span style="background-color: #cde1ff">________ (<b><i>________</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
DataFieldDescription_____________________________<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>_______:searchterm</i></li>
<li>Search for: &#160; <i>_______:_______</i><br />
to show genetic/genomic elements for __________.</li>
<li>Search for: &#160; <i>_________:_________ AND _________:_________</i><br />
to show ___________________________.</li>
</ul>
</li -->
<!-- ======== END_MicroBIGG-E_DATA_FIELD_XXXXXXX ========== -->
<!-- ======== MicroBIGG-E_DATA_FIELD_XXXXXXX ========== -->
<!-- li id="microbigge-data-field-XXXXXXXX">
<span style="background-color: #cde1ff">_________ (<b><i>_________</i></b>)</span>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-data-fields-list"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="list of MicroBIGG-E data fields" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
DataFieldDescription_____________________________<br /><br />
Data field names and values are <a href="#case-sensitive"><b>case sensitive</b></a>, as shown in the examples below. Additional sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> (such as the asterisk or question mark).<br /><br />
<b>Examples:</b>
<ul>
<li>To search this field directly, enter a query such as: &#160;
<i>_______:searchterm</i></li>
<li>Search for: &#160; <i>_______:_______</i><br />
to show genetic/genomic elements for __________.</li>
<li>Search for: &#160; <i>_________:_________ AND _________:_________</i><br />
to show ___________________________.</li>
</ul>
</li -->
<!-- ======== END_MicroBIGG-E_DATA_FIELD_XXXXXXX ========== -->
<!-- /ul -->
<!-- ======== END_MicroBIGG-E_DATA_FIELD_GROUP_XXXXXXX ======== -->
<!-- ========= END_MicroBIGG-E_DATA_FIELDS_DESCRIPTIONS =========== -->
</div>
<!-- =========== END_MicroBIGG-E_DATA_FIELDS ============ -->
<!-- =========== MicroBIGG-E_OUTPUT ============ -->
<h4 id="microbigge-output">Output from MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<div style="padding-left: 2em">
<!-- ========= MicroBIGG-E_OUTPUT_TABLE ============ -->
<span id="microbigge-output-table"><b>Tabular list of genes and genetic elements</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>Upon opening the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> web interface, a table displays data for <b>all genetic and genomic elements</b> that have been identified in isolate genomes that have been deposited into GenBank.</li>
<li><b>Every row</b> in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> display is an <b>antimicrobial resistance (AMR)</b>, <b>stress response</b>, and/or <b>virulence</b> gene that has been identified in an isolate by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>.</li>
<li>The data available for each item can include gene name, type, subtype, class, subclass, method used to identify the element, supporting evidence, and more, as available. (See the <a href="#microbigge-data-fields">MicroBIGG-E data fields</a> for a complete list.) Some of the data elements, such as accessions for BioSample, nucleotide sequence, and protein sequence records, <b>link</b> to additional information in the corresponding databases.</li>
<li>The genes can be <b>sorted</b> by clicking on column headers, <b>faceted</b> by using <a href="#microbigge-output-filters">filters</a> (e.g., class:AMINOGLYCOSIDE), or <b>searched</b> using <a href="#microbigge-basic-search">basic</a> or <a href="#microbigge-advanced-search">advanced</a> search techniques. <!-- (see <a href="#microbigge-sample-searches"><span style="color:#d70000">use cases/sample searches</span> of MicroBIGG-E</a> and an <a href="#microbigge-illustration"><span style="color:#d70000">illustrated example</span> of search results</a>). --></li>
</ul>
<!-- ========= END_MicroBIGG-E_OUTPUT_TABLE ============ -->
<!-- ========= MicroBIGG-E_FILTERS ============ -->
<span id="microbigge-output-filters"><b>Filters to refine results</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The "Filters" menu options in the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> web interface enable you to <b>facet or subset the data</b> in a variety of ways, and therefore can be used to refine your results, whether you have done a <a href="#microbigge-basic-search">basic search</a> or an <a href="#microbigge-advanced-search">advanced search</a>.</li>
<li>By default, each filter displays the <b>top 100 terms</b> (based on the number of genes/alleles retrieved by a term) listed by count of value within that set of top 100.</li>
<li id="microbigge-filters-on-the-fly"><b>Filters are generated on the fly</b>. The choices listed in the "Filters" tab depend on the data set you are currently displaying in the browser, and reflect the attributes of the genes and alleles in that data set.</li>
<li>A separate section of this document provides <a href="#microbigge-filters">additional information about Filters</a>.</li>
</ul>
<!-- ========= END_MicroBIGG-E_FILTERS ============ -->
<!-- ========= MicroBIGG-E_OUPUT_DISPLAY_OPTIONS ========= -->
<span id="microbigge-display-options"><b>Customize the MicroBIGG-E display</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>The columns displayed by MicroBIGG-E reflect the <a href="#microbigge-data-fields">data fields</a>. By default, MicroBIGG-E displays only a subset of the available data fields.</li>
<li id="microbigge-choose-columns">You can use the "<b>Choose Columns</b>" option at the top of the tabular list of genes in order to remove columns, select additional columns to display, and/or change the order of the columns.</li>
<li>The options you select will <b>persist</b> within a given browser (e.g., Chrome, Edge, Internet Explorer, Firefox, Safari) until that browser's cookies are cleared/reset.</li>
</ul>
<!-- ========= END_MicroBIGG-E_OUPUT_DISPLAY_OPTIONS ========= -->
<!-- ========= MicroBIGG-E_cross_browser ========= -->
<span id="microbigge-cross-browser-selection"><b>Cross-browser selection</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br />
<ul>
<li>It is possible to view isolates that you have identified in MicroBIGG-E in the <a href="#isolates-browser">Isolates Browser</a>.</li>
<li>Click the <b>Cross-browser selection</b> button to the right of the Download button (you must be logged into your myNCBI account for this functionality). By default, all of the isolates for every row of your MicroBIGG-E search will be selected, as indicated by the checkbox column; however, you can deselect rows manually.</li>
<li>Then click the <b>Show in Isolates</b> button. A new tab will open with the Isolates browser results for the selected elements in MicroBIGG-E. You can then examine clusters of interest using the <a href="#snp-tree-viewer">SNP Tree Viewer</a>, or perform other tasks in the <a href="#isolates-browser">Isolates Browser</a>.</li>
</ul>
<!-- ========= END_MicroBIGG-E_cross_browser ========= -->
</div>
<!-- =========== END_MicroBIGG-E_OUTPUT ============ -->
<!-- =========== MicroBIGG-E_SAMPLE_SEARCHES ============ -->
<h4 id="microbigge-sample-searches">Use cases/sample searches of MicroBIGG-E <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><a href="#microbigge-sample-search-genes-co-occur-on-contig">Identify hits from isolates with specific genes that co-occur on the same contig</a></li>
<li><a href="#microbigge-sample-search-partial-gene-in-middle-of-contig">Identify partial gene sequences in the middle of contigs</a></li>
<li><a href="#microbigge-sample-search-find-alleles-described-by-publication">Find the isolates and alleles described by a publication of interest</a></li>
<li><a href="#microbigge-sample-search-isolates-with-co-occurring-genes">Display isolates in isolates browser that have the same set of genes co-occurring on the same contig</a></li>
<li><a href="#microbigge-sample-search-hits-from-isolates-with-co-occurring-genes">Display hits from isolates with co-occurring genes</a></li>
<!-- li><a href="#microbigge-sample-search-_______">___________</a></li -->
</ul>
<!-- ====== MicroBIGG-E_SAMPLE_SEARCH_isolates_with_same_genes_that_co_occur_on_the_same_contig =========== -->
<span id="microbigge-sample-search-genes-co-occur-on-contig"><b>Identify hits from isolates with specific genes that co-occur on the same contig</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example, identify hits from contigs that have a set of genes (e.g., blaTEM-1 and blaKPC*) co-occurring on the same contig. A researcher might want to know which contigs (likely plasmids) have TEM-1 and a KPC allele, as opposed to a specific allele, since a single mutational event can alter the KPC allele and its clinical phenotype (such as KPC-3 and KPC-28), in order to understand the co-transmission and co-evolution of these two gene families.<br />
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>Search for contigs with genes of interest (e.g., blaTEM-1 and blaKPC*)</li>
<li>To do this, enter a search such as:<br />
<i><a href="/pathogens/isolates#/microbigge/genes_on_contig:blaTEM-1%20AND%20genes_on_contig:blaKPC*">genes_on_contig:blaTEM-1 AND genes_on_contig:blaKPC*</a></i><br />
(Note that field-specified searches are <a href="#case-sensitive"><b>case-sensitive</b></a>, and separate sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk.)
</li>
<li>Examine whether the genes of interest co-occur on the same contig, either by clicking Download or by visual inspection.</li>
</ul>
</div>
<!-- ====== END_MicroBIGG-E_SAMPLE_SEARCH_isolates_with_same_genes_that_co_occur_on_the_same_contig =========== -->
<!-- ====== MicroBIGG-E_SAMPLE_SEARCH_partial_gene_in_middle_of_contig =========== -->
<span id="microbigge-sample-search-partial-gene-in-middle-of-contig"><b>Identify partial gene sequences in the middle of contigs</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example, identify partial gene sequences in the middle of contigs, as that form of partiality might imply loss or alteration of function, and might need to be excluded or treated differently:<br />
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>For a given isolate and gene sequence (i.e., row), exclude rows where the method equals "PARTIAL_CONTIG_ENDP" or "PARTIAL_CONTIG_ENDX".</li> <li>To do this, enter a search such as:<br />
<i><a href="/pathogens/isolates#/microbigge/amr_method:PARTIAL*%20AND%20NOT%20amr_method:PARTIAL_CONTIG_END*">amr_method:PARTIAL* AND NOT amr_method:PARTIAL_CONTIG_END*</a></i><br />
(Note that field-specified searches are <a href="#case-sensitive"><b>case-sensitive</b></a>, and separate sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk.)
</li>
</ul>
</div>
<!-- ====== END_MicroBIGG-E_SAMPLE_SEARCH_partial_gene_in_middle_of_contig =========== -->
<!-- ====== Begin_MicroBIGG-E_SAMPLE_SEARCH_genes_on_same_contig_isolates_browser =========== -->
<span id="microbigge-sample-search-isolates-with-co-occurring-genes"><b>Display isolates in isolates browser that have the same set of genes co-occurring on the same contig</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
Having identified which contigs (likely plasmids) have TEM-1 and a KPC allele, a researcher might want to see their phylogenetic context in the SNP Tree Viewer:
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>Search for contigs that have a blaKPC gene and a blaTEM-1 allele.</li> <li>To do this, enter the following search:<br />
<i><a href="/pathogens/isolates/#/microbigge/genes_on_contig:blaTEM-1%20AND%20genes_on_contig:blaKPC*">genes_on_contig:blaTEM-1 AND genes_on_contig:blaKPC*</a></i><br />
(Note that field-specified searches are <a href="#case-sensitive"><b>case-sensitive</b></a>, and separate sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk.)
</li>
<li>Click the <a href="#microbigge-cross-browser-selection">Cross-browser selection</a> button to the right of the Download button (you must be logged into your myNCBI account for this functionality).</li>
<li>A new tab will open in the Isolates Browser containing all of the isolates meeting your search criteria. You can then examine clusters of interest using the <a href="#snp-tree-viewer">SNP Tree Viewer</a>, or perform other tasks in the <a href="#isolates-browser">Isolates Browser</a>.</li>
</ul>
</div>
<!-- ====== End_MicroBIGG-E_SAMPLE_SEARCH_genes_on_same_contig_isolates_browser =========== -->
<!-- ====== Begin_MicroBIGG-E_SAMPLE_SEARCH_co-ocurring_genes =========== -->
<span id="microbigge-sample-search-hits-from-isolates-with-co-occurring-genes"><b>Display hits from isolates with co-occurring genes</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
Get all hits from isolates that share a set of genes. You can then link to the <a href="#isolates-browser">Isolates Browser</a> (and subsequently the <a href="#snp-tree-viewer">SNP Tree Viewer</a>) to get more information about those isolates using <a href="#microbigge-cross-browser-selection">Cross-browser selection</a>. For example, get a set of hits from all isolates that share both a blaTEM-1 and a blaKPC gene.
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>Search for hits from isolates that have a blaKPC gene and a blaTEM-1 allele.</li> <li>To do this, enter the following search:<br />
<i><a href="/pathogens/isolates/#/microbigge/genes_on_isolate:blaTEM-1%20AND%20genes_on_isolate:blaKPC*">genes_on_isolate:blaTEM-1 AND genes_on_isolate:blaKPC*</a></i><br />
(Note that field-specified searches are <a href="#case-sensitive"><b>case-sensitive</b></a>, and separate sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk.)
</li>
<li>Click the <a href="#microbigge-cross-browser-selection">Cross-browser selection</a> button to the right of the Download button (you must be logged into your myNCBI account for this functionality).</li>
<li>A new tab will open in the Isolates Browser containing all of the isolates meeting your search criteria. You can then examine clusters of interest using the <a href="#snp-tree-viewer">SNP Tree Viewer</a>, or perform other tasks in the <a href="#isolates-browser">Isolates Browser</a>.</li>
</ul>
</div>
<!-- ====== End_MicroBIGG-E_SAMPLE_SEARCH_co-ocurring_genes =========== -->
<!-- ====== MicroBIGG-E_SAMPLE_SEARCH_find-isolates-and-alleles-described-by-publication =========== -->
<span id="microbigge-sample-search-find-alleles-described-by-publication"><b>Find the isolates and alleles described by a publication of interest</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style="padding-left: 2em">
As an example, the paper by Shields, et al., describes a two amino-acid deletion in blaACT alleles that confers resistance to ceftazidime-avibactam (<a href="https://pubmed.ncbi.nlm.nih.gov/32236408/">PubMed ID 32236408</a>)<!--https://academic.oup.com/cid/advance-article/doi/10.1093/cid/ciaa355/5814288 -->. Use the publication and MicroBIGG-E to retrieve and examine the isolates and specific alleles reported in the paper:<br />
<ul>
<li>Identify the isolates, "Surv196" and "ENT630," from the paper that have these blaACT variants.</li>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>Search for the isolates in the <a href="#microbigge-data-field-strain">strain</a> data field by entering the following query:<br />
<i><a href="/pathogens/isolates/#/microbigge/strain:Surv196%20OR%20strain:ENT630">strain:Surv196 OR strain:ENT630</a></i><br />
(Note that field-specified searches are <a href="#case-sensitive"><b>case-sensitive</b></a>, and separate sections of this document provide tips about search terms that contain <a href="#special-characters">special characters</a> (such as the parentheses, hyphens, and apostrophes), and the use of <a href="#wildcards">wildcards</a> such as the asterisk.)</li>
<li>Identify the <i>blaACT</i> alleles among the genetic/genomic elements that are retrieved by MicroBIGG-E.</li>
<li>For the allele of interest, retrieve the corresponding WP_* accession from the <a href="https://www.ncbi.nlm.nih.gov/protein/">Protein database</a> to view the RefSeq protein sequence record. In this case, the accessions for the <i>blaACT</i> proteins that were identified on the isolate genomes are: <a href="https://www.ncbi.nlm.nih.gov/protein/WP_154123408.1">WP_154123408.1</a> (on the Surv196 isolate) and <a href="https://www.ncbi.nlm.nih.gov/protein/WP_152819218.1">WP_152819218.1</a> (on the ENT630 isolate).</li>
<!-- li>TESTING NOTES: For the blaACT allele in the isolate strain Surv196, the <a href="#microbigge-data-field-protein"><i>protein_acc</i></a> column lists <a href="https://www.ncbi.nlm.nih.gov/protein/WP_154123408.1">WP_154123408.1</a> and the <a href="#microbigge-data-field-closest-reference-accession"><i>closest_reference_acc</i></a> column lists <a href="https://www.ncbi.nlm.nih.gov/protein/WP_032652275.1">WP_032652275.1</a>. The latter accession is linked to the corresponding protein sequence record.)</li -->
<!-- li>TESTING NOTES: For the blaACT allele in the isolate strain ENT630, note that the <a href="#microbigge-data-field-protein"><i>protein_acc</i></a> column lists <a href="https://www.ncbi.nlm.nih.gov/protein/WP_152819218.1">WP_152819218.1</a> and the <a href="#microbigge-data-field-closest-reference-accession"><i>closest_reference_acc</i></a> column lists <a href="https://www.ncbi.nlm.nih.gov/protein/WP_017694683.1">WP_017694683.1</a>. The latter accession is linked to the corresponding protein sequence record.)</li -->
<li>Note that a WP_* accession can appear in the <a href="#microbigge-data-field-protein"><i>protein_acc</i></a> column and/or the <a href="#microbigge-data-field-closest-reference-accession"><i>closest_reference_acc</i></a> column.
<ul>
<li>Use the <a href="#microbigge-choose-columns">choose columns</a> function to display the desired data fields, as only a subset are displayed by default.</li>
<li>The <a href="#microbigge-data-field-protein"><i>protein_acc</i></a> column and <a href="#microbigge-data-field-closest-reference-accession"><i>closest_reference_acc</i></a> column might contain the <b>same value</b> (if the protein sequence of the element that was annotated on the isolate genome is identical to the reference protein sequence), or <b>different values</b> (if the protein sequence of the element that was annotated on the isolate genome is not identical to the reference protein sequence).</li>
<li>If a WP_* accession is not linked to the <a href="https://www.ncbi.nlm.nih.gov/protein/">Protein database</a>, you can search for the accession number directly in the Protein database.</li>
</ul>
</li>
</ul>
</div>
<!-- ====== END_MicroBIGG-E_SAMPLE_SEARCH_find-isolates-and-alleles-described-by-publication =========== -->
<!-- ====== MicroBIGG-E_SAMPLE_SEARCH_XXXXXXXXXX =========== -->
<!-- span id="microbigge-sample-search-_______"><b>___TEMPLATE_single_line_summary_of_use_case____</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style='padding-left: 2em'>
As an example, _______________:<br />
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>_____________________</li>
<li>_____________________</li>
<li>_____________________</li>
</ul>
</div -->
<!-- ====== END_MicroBIGG-E_SAMPLE_SEARCH_XXXXXXXXXX ======== -->
<!-- ====== MicroBIGG-E_SAMPLE_SEARCH_XXXXXXXXXX =========== -->
<!-- span id="microbigge-sample-search-_______"><b>___TEMPLATE_single_line_summary_of_use_case_that_uses_FILTERS_function____</b></span> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#microbigge-sample-searches"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="MicroBIGG-E help, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a><br /><br />
<div style='padding-left: 2em'>
As an example:<br />
<ul>
<li>Open the <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a>: <b>Micro</b>bial <b>B</b>rowser for <b>I</b>dentification of <b>G</b>enetic and <b>G</b>enomic <b>E</b>lements.</li>
<li>Open the "<b><i>Filters</i></b>" function.</li>
<li>By <b>default</b>, each filter shows the <b>top 10 terms</b> (based on the number of genes/alleles retrieved by a term).</li>
<li>In the <b><i>_____</i></b> section of the filters, click on "<b><i>[+]more</i></b>" to see up to the <b>top 100 terms</b> available (based on the number of genes/alleles retrieved by a term, and listed alphabetically within that set of top 100).</li>
<li>"<b><i>_____</i></b>" now appears as an option under <b><i>_____</i></b>. Select that option. Upon this action, the Filters display will refresh itself to show only the set of filters that apply to that ______, and the tabular list of genes and alleles will refresh itself to show only the items that fall in that class.</li>
</ul>
<i>An alternative method for retrieving those genetic elements is to search the ______ data field directly. To do this, open <a href="/pathogens/isolates#/microbigge/">MicroBIGG-E</a> and enter the query:<br /> <b>_____:______</b><br />
Separate sections of this file provide details about <a href="#microbigge-filters">filters</a>, and about how to directly search specific <a href="#microbigge-data-fields">data fields</a>, such as the <a href="#microbigge-data-field-____">____</a> and <a href="#microbigge-data-field-_____">_____</a> fields, and <a href="#case-sensitive">case sensitive</a> searches.</i><br /><br />
</div -->
<!-- ====== END_MicroBIGG-E_SAMPLE_SEARCH_XXXXXXXXXX ======== -->
<!-- =========== END_MicroBIGG-E_SAMPLE_SEARCHES ============ -->
</div>
<!-- =========== END_MicroBIGG-E ============ -->
<!-- =========== AMR_SUBMIT_DATA ============ -->
<h3 id="amr-submit">Submit sequence and phenotype data related to AMR <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li><a href="/pathogens/submit-data/">Submit data for real-time analysis</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/biosample/docs/antibiogram/">Submit antibiograms to the BioSample database</a></li>
<li><a href="/pathogens/submit-beta-lactamase/">Request new alleles for Beta-Lactamase, MCR, and Qnr Genes</a></li>
</ul>
<!-- =========== END_AMR_SUBMIT_DATA ============ -->
<!-- =========== AMR_FTP_RAW_DATA ============ -->
<h3 id="amr-ftp">Download AMR Raw Data <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#amr"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Antimicrobial resistance (AMR) resources, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The AMR subdirectory of the Pathogens FTP site allows <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance">Raw Data Download</a>. It includes AMRFinderPlus data files and the Bacterial Antimicrobial Resistance Reference Gene Database (BioProject <a href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA313047">PRJNA313047</a>).<br />
<i>(An <a href="#ftp">overview of the Pathogens FTP site</a> is provided below.)</i>
</div>
<br />
<!-- =========== END_AMR_FTP_RAW_DATA ============ -->
<!-- ######## END_H2_SECTION:ANTIMICROBIAL_RESISTANCE_AMR_RESOURCES ######## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:FTP_SITE ########## -->
<h2 id="ftp">FTP Site help <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#ftp-what-is">What data are on the FTP site?</a><br />
<a href="#ftp-directory-structure">How are the data organized?</a><br />
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="20" height="1" border="0" /><a href="#ftp-results">Results directory</a><br />
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="20" height="1" border="0" /><a href="#ftp-reference">Reference directory</a><br />
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="20" height="1" border="0" /><a href="#ftp-antimicrobial-resistance">Antimicrobial_resistance directory</a><br />
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="20" height="1" border="0" /><a href="#ftp-other">Other directories</a><br />
<a href="#ftp-readme">FTP Readme File</a><br />
</div -->
<ul>
<li><a href="#ftp-what-is">What data are on the FTP site?</a></li>
<li><a href="#ftp-directory-structure">How are the data organized?</a>
<ul>
<!-- li><a href="#FTPParentDirectory">Parent directory</a></li -->
<li><a href="#ftp-results">Results directory</a></li>
<li><a href="#ftp-reference">Reference directory</a></li>
<li><a href="#ftp-antimicrobial-resistance">Antimicrobial_resistance directory</a></li>
<li><a href="#ftp-other">Other directories</a></li>
</ul>
</li>
<li><a href="#ftp-readme">FTP Readme File</a></li>
</ul>
<!-- ========= FTP_SITE_WHAT_IS ============ -->
<h3 id="ftp-what-is">What data are on the Pathogens FTP site? <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#ftp"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="FTP site, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
The NCBI Pathogen Detection analysis pipeline artifacts are copied to FTP for bulk downloading. The data that are available include metadata tables, cluster lists, and individual SNP trees, and mimic what is available in the Pathogen Browser. In addition, there are files that support efforts for antimicrobial resistance gene detection including reference tables, and files used by NCBI <a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>.
</div>
<!-- ======== END_FTP_SITE_WHAT_IS ========= -->
<!-- ========= FTP_SITE_DIRECTORY_STRUCTURE ============ -->
<h3 id="ftp-directory-structure">How are the Pathogens data organized on the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">FTP site?</a> <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#ftp"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="FTP site, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<a href="#ftp-results">Results directory</a> | <a href="#ftp-reference">Reference directory</a> | <a href="#ftp-antimicrobial-resistance">Antimicrobial Resistance directory</a> | <a href="#ftp-other">Other directories</a>
</div>
<ul>
<!-- ======= FTP_RESULTS_DIRECTORY ======= -->
<li id="ftp-results"><b><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">Results directory</a></b>:<br />
Individual phylogenetic trees for each SNP cluster are available in the Pathogens FTP <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">"Results" directory</a>.<br /><br />
Note: Individual phylogenetic trees for each SNP cluster are also accessible from the NCBI Pathogen Detection Isolates Browser. In the Isolates Browser, isolates that have "PDS*" accession number in the "SNP Cluster" column have a link to the SNP Tree Viewer, which provides an interactive display of the SNP cluster. <i>(<a href="#snp-tree-viewer">read more...</a>)</i><br /><br />
Each folder in this directory contains the data analysis results, such as phylogenetic distance trees, for a given organism group. The folders contain the results of the most current data analyses, as well as archival results from previous analyses. The results for a given organism group are <b>updated daily</b> for each taxgroup, only if new data arrives. Archived results are stored according to the <a href="#data-retention">data retention policy</a>.<br />
<ul>
<li id="ftp-organism-specific"><b>Organism group folders</b> - These folders contain the results of data analyses, such as phylogenetic distance trees, that were done on the genome assemblies of isolates within each organism group in the Pathogen Detection Project.
Within a given organism group, the subfolder named with the most recent Pathogen Detection Group accession.version number (PDGxxxxxxxxxx.xxx*) contains the most recent results. The results for a given organism group are <b>updated daily</b> for each taxgroup, only if new data arrives. The "<b>latest_kmer</b>" and "<b>latest_snps</b>" links provide updated links to the most recent results for kmer and SNP analyses, respectively, which may be asynchronously produced (may point to different PDG versions); otherwise they will both point to the most recent PDG version.<br />
<ul>
<li id="ftp-rapid-reports"><b>Rapid_reports for select organisms</b> - This directory is a pilot phase test of rapid reporting based solely on wgMLST allele differences and is only operational for a few submitters for a few organisms. The FTP Rapid Reports for a given organism are <b>updated on average within an hour</b> of receiving sequence read submissions for a new isolate.</li>
</ul>
</li>
</ul>
</li>
<!-- ======= FTP_REFERENCE_DIRECTORY ======= -->
<li id="ftp-reference"><b><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Reference/">Reference directory</a></b>:<br />
This directory does NOT include real-time analysis results, and is only based on genomes available in GenBank that are not submitted as part of surveillance networks to SRA.
</li>
<!-- ======= FTP_ANTIMICROBIAL_RESISTANCE_DIRECTORY ======= -->
<li id="ftp-antimicrobial-resistance"><b><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/">Antimicrobial_resistance directory</a></b>:<br />
This directory contains the reference table for AMR genes, and the data files used for AMRFinderPlus.<br />
For more information on NCBI's efforts on antimicrobial resistance, see this page:<br />
<a href="/pathogens/antimicrobial-resistance/">/pathogens/antimicrobial-resistance/</a>.<br />
For more information on AMRFinderPlus see this page:<br />
<a href="/pathogens/antimicrobial-resistance/AMRFinder/">/pathogens/antimicrobial-resistance/AMRFinder/</a>.
</li>
<!-- ======= FTP_OTHER_DIRECTORIES ======= -->
<li id="ftp-other"><b><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/">Other directories</a></b>:<br />
For descriptions of the other subdirectories see the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">FTP README file.</a>
</li>
</ul>
<!-- ======== END_FTP_SITE_DIRECTORY_STRUCTURE ========= -->
<!-- ========= FTP_SITE_README ============ -->
<h3 id="ftp-readme">FTP Readme File <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#ftp"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="FTP site, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>For more information on directory structure, filetypes, and details on what data are available, please see the Pathogen Detection Project FTP readme file available at: <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt"><b>https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt</b></a></li>
</ul>
<br />
<!-- ======== END_FTP_SITE_README ========= -->
<!-- ########## END_H2_SECTION:FTP_SITE ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:DATA_SUBMISSIONS ########## -->
<h2 id="submit">Data Submissions <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em' -->
<ul>
<li>Please refer to <a href="https://www.ncbi.nlm.nih.gov/pathogens/submit-data/">these instructions to submit data to the NCBI Pathogen Detection resource.</a></li>
</ul>
<br />
<br />
<!-- ########## END_H2_SECTION:DATA_SUBMISSIONS ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:DATA_PROCESSING ########## -->
<h2 id="data-processing">Data Processing Pipeline<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- ========== MINI-TOC =========== -->
<div style="padding-left: 2em">
Please refer to <a href="/pathogens/docs/data_processing">Data Processing Pipeline</a>
<br /><br />
</div>
<!-- ########## END_H2_SECTION:DATA_PROCESSING ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:DATA_RETENTION_HISTORY_TRACKING ########## -->
<h2 id="data-retention">Data Retention and History Tracking<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- div style='padding-left: 2em'>
<a href="#data-evolve"><b>Pathogen data</b> and analysis results continue to <b>evolve</b></a><br />
<a href="#three-critical-data-objects"><b>Three critical data objects</b> are <b>tracked</b></a><br />
<a href="#accession-version"><b>Accession.Versions</b> are used to <b>track changes</b></a><br />
<a href="#data-retention-display-previous-data"><b>Two interactions</b> that may not present the most up-to-date information</a><br />
<a href="#data-retention-two-states"><b>Two states for data retention</b> besides the most up-to-date version</a><br />
<a href="#data-retention-scenarios"><b>Example scenarios</b>: requests for previous versions of data that are older than <b>30 days</b></a><br />
<a href="#data-retention-share"><b>Shared URLs</b> are valid for <b>60 days</b></a>
<a href="#data-retention-ftp">Data retention policy for ftp</a>
</div -->
<ul>
<li><a href="#isolates-browser-data-retention">Pathogen Detection Isolates Browser data retention</a>
<ul>
<li><a href="#data-evolve">Pathogen data and analysis results continue to evolve</a></li>
<li><a href="#three-critical-data-objects">Three critical data objects are tracked</a></li>
<li><a href="#accession-version">Accession.Versions are used to track changes</a></li>
<li><a href="#data-retention-display-previous-data">Two interactions that may not present the most up-to-date information</a></li>
<li><a href="#data-retention-two-states">Two states for data retention besides the most up-to-date version</a></li>
<li><a href="#data-retention-scenarios">Example scenarios: responses to requests for previous versions of data that are older than 30 days</a></li>
<li><a href="#data-retention-share">Shared URLs are valid for 60 days</a></li>
<li><a href="#data-retention-ftp">Data retention policy for ftp</a></li>
</ul>
</li>
<li><a href="#microbigge-data-retention">MicroBIGG-E data retention</a></li>
<li><a href="#reference-data-retention">Reference data retention</a>
(Reference Gene Catalog, Reference Gene Hierarchy, Reference HMM Catalog, and AMRFinderPlus database)
</li>
</ul>
<!-- ========= EVOLVING_DATA_AND_ANALYSIS_RESULTS ============ -->
<h3 id="data-evolve">Pathogen Reference Data and Analysis Results Continue to Evolve <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>Unlike many other databases and resources at NCBI, the <b><a href="/pathogens/">Pathogen Detection Project</a> was designed to provide updates of analyses in real-time. Therefore, the content of the resource may be updated multiple times per day.</b> For any given <b>pathogen isolate, organism group, or SNP cluster</b>, the Pathogen Detection Browsers display, by default, the <b>most current data and analysis results</b>, including the relationships among isolates that have been calculated by the <a href="/pathogens/docs/data_processing">data processing pipeline</a>. Therefore, for most uses of the browsers, the latest data are being presented.
Of the browsers only the isolates browser retains some tracking of history as <a href="#three-critical-data-objects">described below</a>. The Reference Browsers (<a href="/pathogens/refgene">Reference Gene Catalog</a>, <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and <a href="/pathogens/hmm">Reference HMM Catalog</a>) all only show data for the most recent release. A complete history is maintained on the FTP site. See <a href="#reference-data-retention">AMRFinderPlus Reference Data Retention</a> for details.</li>
</ul>
<!-- ========= END_EVOLVING_DATA_AND_ANALYSIS_RESulTS ============ -->
<!-- ========= ISOLATES_BROWSER_DATA_RETENTION ======== -->
<h3 id="isolates-browser-data-retention">Isolates Browser data retention <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<!-- ======== THREE_CRITICAL_DATA_OBJECTS_ARE_TRACKED ====== -->
<h4 id="three-critical-data-objects">Three critical Isolates Browser data objects are tracked <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The system tracks versions for three critical data objects:
<ol>
<li>the assembly of any <b>isolate</b> ("<a href="#accession-prefix-pdt">PDT</a>")</li>
<li>the <b>SNP cluster</b> of an isolate if it belongs to one ("<a href="#accession-prefix-pds">PDS</a>")</li>
<li>the <b>organism group</b> ("<a href="#accession-prefix-pdg">PDG</a>")</li>
</ol>
The organism group is the entire package of new isolate updates, which could consist of both new or updated assemblies as well as new or updated clusters. Updates of each organism group could occur as frequently as every 24 hours, and as each organism group is independent of one another, multiple organism groups could be updated in a given day.
</li>
</ul>
<!-- ====== END_THREE_CRITICAL_DATA_OBJECTS_ARE_TRACKED ======= -->
<!-- ========= ACCESSION.VERSIONS_USED_TO_TRACK_CHANGES ============ -->
<h4 id="accession-version">Accession.Versions are used to track changes <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>The Pathogen Detection Project assigns an <b>accession.version</b> to each isolate genome assembly, organism group, and SNP cluster in order to track changes to the pathogens data and analysis results. For example:<br /><br />
<ul>
<li id="pdt-accession-version">The <b>Pathogen Detection Target</b> ("<b>PDT</b>" accession.version) is the genome assembly for an individual <b>isolate</b>.<br />
A new version of a <a href="#accession-prefix-pdt">PDT</a> record indicates a change in the assembly.</li>
<li id="pds-accession-version">The <b>Pathogen Detection SNP cluster</b> ("<b>PDS</b>" accession.version) is a group of <b>isolates that are closely related</b>, based on the SNP distance between their genome assemblies as calculated by the Pathogen Detection Project <a href="/pathogens/docs/data_processing">data processing pipeline</a>.<br />
A new version of a <a href="#accession-prefix-pds">PDS</a> record may indicate changes such as the following:<br />
<ul>
<li>The SNP cluster changed its membership.</li>
<li>Some of its SNP distances have changed among the isolates that are members of the SNP cluster<!-- Some of its inter-target distances changed --></li>
</ul>
<br />
</li>
<li id="pdg-accession-version">The <b>Pathogen Detection Group</b> ("<b>PDG</b>" accession.version) is also known as an <b>organism group</b>.<br />
A new version of a <a href="#accession-prefix-pdg">PDG</a> record includes additions or deletions of isolates, or changes to isolate assemblies. All of these isolate assembly changes may or may not include changes to SNP clusters (additions, deletions, modifications). The Pathogen Detection Project retains the <b>most recent 300 versions</b> of a PDG.<br />
<ul>
<li><i>Technical note: An organism group (PDG) contains one or more targets (PDTs). A PDT is a member of zero or one SNP cluster (PDS), and never more than one cluster. A SNP cluster is composed of two or more PDTs, and each PDS is completely contained within a PDG.</i></li></ul><br />
</li>
</ul>
As the data and analysis results evolve, the Pathogen Detection Project applies data retention and history tracking policies as described below.
</li>
</ul>
<!-- ======== END_ACCESSION.VERSIONS_USED_TO_TRACK_CHANGES ========= -->
<!-- ======== TWO_INTERACTIONS_THAT_MAY_DISPLAY_PREVIOUS_DATA ====== -->
<h4 id="data-retention-display-previous-data">Two interactions that may not present the most up-to-date information <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>As noted under <a href="#data-evolve">Pathogen Data and Analysis Results Continue to Evolve</a>, the <b>latest data are presented by default</b> for most uses of the browser. There are <b>only two specific user interactions with the browser that may not present the most up-to-date information</b>: 1) searches with specific accession.versions of one of the <a href="#three-critical-data-objects">three objects</a> mentioned above (PDT, PDG, PDS) that are from older analyses, and 2) the <a href="#data-retention-share">"share URL"</a> button on the SNP Tree Viewer. For both of these cases there is a data retention policy in place that culls older data (i.e., removes versions of isolates, organism groups, and SNP clusters that were retired more than 30 days ago) so that the system does not need to retain every single piece of data ever calculated.</li>
</ul>
<!-- ====== END_TWO_INTERACTIONS_THAT_MAY_DISPLAY_PREVIOUS_DATA ======= -->
<!-- ============ TWO_STATES_FOR_DATA_RETENTION =========== -->
<h4 id="data-retention-two-states">Two states for data retention besides the most up-to-date version <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>There are two states for data retention besides the most up to date version. These include a window of 30 days where older data can be viewed, including the SNP tree as it looked for that particular version, and beyond that, the interface will present the user with links to the most current versions of that data.</li>
</ul>
<!-- ====== END_TWO_STATES_FOR_DATA_RETENTION ======= -->
<!-- == EXAMPLE_SCENARIOS_REQUEST_PREVIOUS_VERSIONS_OLDER_THAN_30_DAYS == -->
<h4 id="data-retention-scenarios">Example scenarios: requests for previous versions of data that are older than 30 days <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li><b>If you try to view previous versions of the data, the following scenarios can occur:</b><br />
<ul>
<li><b>If you are requesting an accession.version that is older than the 30 day retention period</b>, you can no longer see the content (e.g., phylogenetic tree, SNP distances, metadata) for a target or cluster. However, the Pathogen Browser will indicate the current version of a requested target or cluster. It can also help you find successor target or cluster(s) if the requested target or cluster no longer exists. These hints are displayed at the top of the Browser.<br />
<ul>
<li>For example, if you enter PDT000000625.5 in the Search Isolates box, you get a message like this:<br />
<i>Record PDT000000625.5 replaced by PDG000000002.1212/PDT000000625.6. The system is directing you to the newer version PDT000000625.6 published in PDG version PDG000000002.1212.</i></li>
</ul><br />
</li>
<li><b>If the requested cluster no longer exists</b>, then a list of one or more successor clusters may be presented. The Pathogen Browser determines the past target membership of the requested cluster and traces forward to the current clusters that contain those targets. This allows forward tracking of a cluster when the cluster has split or merged over time, or has been completely replaced.<br />
<ul>
<li>For example, if you enter PDS000029842.1 in the Search Isolates box, you get a message like this:<br />
<i>SNP cluster(s) succeeded by PDG000000002.1212/PDS000032550.9.</i></li>
</ul><br />
</li>
<li><b>Occasionally a target may be withdrawn (taken out of service) usually as a result of data retraction by a submitter</b>. When you request such a target, the Pathogen Browser will try to direct you to the cluster (or its successor(s)) that once included the target as a member.<br />
<ul>
<li>For example, if you enter PDT000111278.1 you will get a message like this:<br />
<i>Record removed: PDT000111278.1 SNP cluster(s) succeeded by PDG000000002.1212/PDS000028815.20.</i></li>
</ul><br />
</li>
<li><b>Using a <a href="#data-retention-share">shared URL</a> that you either made in the past or got from a collaborator</b> could result in any one of the following, depending on the age of the shared URL and whether the URL refers to actual content within the 30-day retention period:<br />
<ul>
<li>A <b>tree viewer display</b> (if the URL refers to current data, or to data that is still available as a result of the 30 day retention policy)<br />OR</li>
<li>A <b>history tracking message</b> such as the ones in the examples above (if the URL is less than 60 days old and refers to data that is no longer available in its previous form)<br />OR</li>
<li>A <b>message saying the URL has expired</b> (if the URL is more than 60 days old). In that case, if you are still interested in viewing the isolate, organism group, or SNP cluster that is cited in the URL, you can enter the corresponding PDT*, PDG*, or PDS* accession number in the <a href="/pathogens/isolates#/search/">Isolates Browser</a> to access the most recent version of the data.</li>
</ul>
</li>
</ul>
</li>
</ul>
<!-- == END_EXAMPLE_SCENARIOS_REQUEST_PREVIOUS_VERSIONS_OLDER_THAN_30_DAYS == -->
<!-- ======== SHARED_URLs_VALID_FOR_60_DAYS ====== -->
<h4 id="data-retention-share">Shared URLs are valid for 60 days <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h4>
<ul>
<li>A "<b>Share</b>" button is available in the SNP Tree Viewer display (as shown in part C of the <a href="#snp-tree-viewer-illustration"><span style="color:#d70000">illustrated example</span> of a SNP Tree Viewer display</a>). It produces a <b>URL that captures your customized view of the tree</b>, which can then be copied and shared with others to reproduce the same view.</li>
<li>The URL is <b>temporary</b>, remaining valid for <b>60 days</b>:<br /><br />
<ul>
<li>For the <b>first 30 days</b>, the URL will open the customized display, showing the isolates you selected and any other customizations you made to the view.</li>
<li>For the <b>second 30 days</b>, the URL continues to be valid, but during that time, it will only show a link to the default display for the most recent version of the SNP cluster. That is, the URL will not open the original customized view, but instead will redirect to a version of the phylogenetic distance tree that reflects the most recent data for the tree.</li>
</ul>
<i>As mentioned near the top of this section on <a href="#data-retention">data retention and history tracking</a>, the composition of a tree can <a href="#data-evolve">change over time</a> as new data are added to the Pathogen Detection Project. Even if a tree remains unchanged, however, a saved URL is only retained in the system for 60 days.</i>
</li>
</ul>
<!-- ======== END_SHARED_URLs_VALID_FOR_60_DAYS ====== -->
<!-- ======== DATA_RETENTION_ON_FTP ====== -->
<h4 id="data-retention-ftp">Isolates browser data published to FTP are also subject to retention policies</h4>
<ul>
<li>Progressive retention policy:<br /><br />
<ul>
<li>Every publication within 30 days</li>
<li>One publication per week after 30 days but within 6 months</li>
<li>One publication per month after 6 months but within 1 year</li>
<li>One publication per year thereafter</li>
</ul>
<i>For latest details <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">please consult the FTP ReadMe.txt file.</a></i>
</li>
</ul>
<!-- ======== END_DATA_RETENTION_ON_FTP ====== -->
<!-- ========= END_ISOLATES_BROWSER_DATA_RETENTION ======== -->
<!-- MICROBIGGE_DATA_RETENTION -->
<h3 id="microbigge-data-retention">MicroBIGG-E data retention <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li><a href="/pathogens/microbigge">MicroBIGG-E</a> and the <a href="/pathogens/docs/microbigge_gcp/"><code>ncbi-pathogen-detect.pdbrowser.microbigge</code> BigQuery table</a> only show the most recent available data. NCBI Pathogen Detection does not archive past results.</li>
</ul>
<!-- END_MICROBIGGE_DATA_RETENTION -->
<!-- REFERENCE_BROWSER_DATA_RETENTION -->
<h3 id="reference-data-retention">Reference browser data retention <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#data-retention"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Data Retention and History Tracking, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li>The three reference browsers (<a href="/pathogens/refgene">Reference Gene Catalog</a>, <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and <a href="/pathogens/hmm">Reference HMM Catalog</a>) only show data from the most recent release. The release version is shown above the upper left of the table (e.g., <b>db version:</b> 2022-08-09.1).</li>
<li>All release versions and the data behind them are archived on the Pathogen Detection FTP site at <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database">https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database</a>. This includes all the data files for the <a href="/pathogens/refgene">Reference Gene Catalog</a>, the <a href="/pathogens/genehierarchy">Reference Gene Hierarchy</a>, and the <a href="/pathogens/hmm">Reference HMM Catalog</a>, the <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">AMRFinderPlus database</a>, a change log (<a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/changes.txt">changes.txt</a>), and the data behind the browsers in tab-delimited text format. See the <a href="https://github.com/ncbi/amr/wiki/AMRFinderPlus-database">AMRFinderPlus wiki</a> for a detailed list of files and the formats of those files.</li>
</ul>
<!-- END_REFERENCE_BROWSER_DATA_RETENTION -->
<!-- ########## END_H2_SECTION:DATA_RETENTION_HISTORY_TRACKING ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:CHANGE_LOG ########## -->
<h2 id="change-log">Log of Changes to Pathogen Detection Project <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<br />Contents:<br />
<ul>
<li><a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Antimicrobial_resistance/AMRFinderPlus/database/latest/changes.txt">AMRFinderPlus database change log</a></li>
<li><a href="#change-log-features">Feature deployment history</a></li>
<li><a href="#change-log-organism-groups">Organism Group history</a></li>
</ul>
<h3 id="change-log-features">Feature deployment <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#change-log"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Log of Changes to Pathogen Detection Project" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<!-- li><b>DD MMM YYYY</b> - ____Description______</li>
<li><b>DD MONTH YYYY</b> - ____Description______</li><br / -->
<li><b>SEPT 2024</b> - <a href="https://ncbiinsights.ncbi.nlm.nih.gov/2024/09/03/milestone-ncbi-pathogen-detection-2m-isolates/">Pathogen Detection hits 2M isolates.</a></li>
<li><b>JULY 2024</b> - Upgraded SeqSero2 to version 1.3.1 (Used for <a href="#isolates-browser-data-field-ComputedTypes">Computed types</a>)</li>
<li><b>APRIL 2024</b> - Released the AST Browser (<a href="/pathogens/ast/">AST Browser</a>).</li>
<li><b>OCTOBER 2023</b> - Released the MicroBIGG-E Map (<a href="/pathogens/microbigge_map">MicroBIGG-E Map</a>).</li>
<li><b>AUGUST 2022</b> - Isolates Browser and MicroBIGG-E data <a href="/pathogens/docs/gcp">available in Google Cloud Platform</a>. </li>
<li><b>JUNE 2022</b> - Reference sequence downloads from the <a href="/pathogens/refgene/">Reference Gene Catalog</a>.</li>
<li><b>OCTOBER 2021</b> - Released the Pathogen Detection Reference Gene Hierarchy (<a href="/pathogens/genehierarchy/">Reference Gene Hierarchy</a>). </li>
<li><b>AUGUST 2021</b> - Changed the Isolation Type / <em>epi_type</em> attribute that affects min-same/min-diff computation to default to NULL instead of environmental/other in the <a href="/pathogens/isolates/">Isolates Browser</a>, <a href="/pathogens/microbigge/">MicroBIGG-E</a>, and <a href="#snp-tree-viewer">SNP Tree Viewer</a>. This means that the min-same/min-diff values for an isolate may show n/a, and other min-same/min-diff values for isolates may change.
Added the <a href="#isolates-browser-data-field-ComputedTypes">Computed types / <em>computed_types</em></a> field to the <a href="/pathogens/isolates/">Isolates Browser</a> and <a href="#snp-tree-viewer">SNP Tree Viewer</a>.</li>
<li><b>MARCH 2021</b> - Released the Pathogen Detection Reference HMM Catalog (<a href="/pathogens/docs/HMM_catalog/">Reference HMM Catalog</a>).</li>
<li><b>JULY 2020</b> - Released the Microbial Browser for Genetic and Genomic Identification (<a href="#microbigge">MicroBIGG-E</a>).</li>
<li><b>FEBRUARY 2020</b> - Added five new data fields to the <a href="/pathogens/isolates#/search/">Isolates Browser</a>, including:
<a href="#isolates-browser-data-field-amrfinderplus-analysis-type">amrfinderplus_analysis_type</a>,
<a href="#isolates-browser-data-field-amrfinderplus-version">amrfinderplus_version</a>,
<a href="#isolates-browser-data-field-refgene-db-version">refgene_db_version</a>,
<a href="#isolates-browser-data-field-stress-genotypes">stress_genotypes</a>, and
<a href="#isolates-browser-data-field-virulence-genotypes">virulence_genotypes</a>. Added a <a href="#isolates-browser-share">"Share" function</a> to the Isolates Browser; it produces a URL that captures your search strategy, which can then be copied and shared with others to execute the search. (The results of the search will change over time as new data become available.) In the SNP Tree Viewer, enhanced the <a href="#search-in-tree">Search &amp; Highlight in Tree</a> function so it now searches all labels that are currently displayed by the SNP Tree Viewer, including custom labels you might have added to the tree. (Previously, the "Search in tree" function searched only the default set of labels.)</li>
<li><b>FALL 2019</b> - Released AMRFinderPlus with <a href="#refgene-data-field-organism">blacklist options</a> for certain genes ubiquitous in some species. Incorporated first fungal pathogen: <a href="/pathogens/isolates#/search/taxgroup_name:%22Candida%20auris%22"><i>Candida auris</i></a>.</li>
<li><b>SUMMER 2019</b> - Released <a href="https://github.com/ncbi/amr/wiki">AMRFinderPlus</a> with additional virulence and stress response genes. Publication by <a href="https://doi.org/10.1128/AAC.00483-19">Feldgarden et al. (2019)</a>, describing the NCBI <a href="#amr-finder">AMRFinder tool</a>, became available in <b><i>Antimicrob Agents Chemother</i></b> as an e-pub ahead of print (<a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">PubMed PMID: 31427293</a>; <a href="https://aac.asm.org/content/early/2019/08/27/AAC.00483-19.long">Full text at AAC</a>, <a href="https://doi.org/10.1128/AAC.00483-19">doi: 10.1128/AAC.00483-19</a>).</li>
<li><b>SPRING 2019</b> - Released <a href="#amr">Antimicrobial Resistance (AMR) resources</a>, including an <a href="/pathogens/antimicrobial-resistance/">AMR landing page</a>, <a href="/pathogens/antimicrobial-resistance/resources/">AMR resources page</a>, and the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>. Preprint by <a href="https://doi.org/10.1101/550707">Feldgarden et al. (2019)</a>, describing the NCBI <a href="#amr-finder">AMRFinder tool</a>, became available in <b><i>BioRxiv</i></b>, <a href="https://doi.org/10.1101/550707">doi.org/10.1101/550707</a>. Released a new service that enables you to receive <a href="#automated-searches">Automatic e-mail notifications of new data</a>. Released the <a href="/pathogens/pathogens_help/">Pathogens help document</a>.
<!-- Released <b>Antimicrobial Resistance (AMR) resources</b>, including an <a href="/pathogens/antimicrobial-resistance/"><b>AMR landing page</b></a>, <a href="/pathogens/antimicrobial-resistance/resources/">AMR resources page</a>, and the <a href="/pathogens/isolates#/refgene/">Pathogen Detection Reference Gene Catalog</a>. Released a new service that enables you to <a href="#automated-searches"><b>Automatic e-mail notifications of new data</b></a>, either for <a href="#automated-searches-save">searches you have <b>saved</b></a> in the <a href="#isolates-browser">Isolates Browser</a>, or for <a href="#automated-searches-watch">isolates you have chosen to <b>watch</b></a> in the <a href="#snp-tree-viewer">SNP Tree Viewer</a>. Added new <a href="#snp-tree-viewer-controls"><b>SNP Tree Viewer display controls</b></a> that enable you to <a href="#expand">expand</a> or <a href="#collapse">collapse</a> tree branches, launch a <a href="#subtree">subtree view</a>, find <a href="#neighbors">neighbors</a> of selected isolates (i.e., genome assemblies that differ by no more than the number of SNPs you have specified), <a href="#search-in-tree">search and highlight isolates</a> in the tree that contain a term(s) of interest, choose <a href="#labels">labels</a> to display for all isolates in the tree, and <a href="#load-labels">load custom labels</a> for one or more specified isolates in a tree view. Released the <a href="/pathogens/pathogens_help/"><b>Pathogens help document</b></a>. --></li>
<!-- li><b>FALL 2018</b> - Additional genes/proteins reported into pathogen browser; additional organisms like Staphylococcus added to the system.[source: IEB seminar, Bill Klimke, 20180215_slide24]</li><br -->
<li><b>SUMMER 2018</b> - Switch to wgMLST clustering begins.</li>
<li><b>MAY 2018</b> - Updated version of pathogen browser to improve navigation within larger SNP trees.</li>
<li><b>FEB 2018</b> - Beta release of Pathogen Browser.</li>
<li><b>JUL 2017</b> - Alpha release of new Pathogen Browser.</li>
<li><b>MAY 2017</b> - Development of rapid reports based on SKESA/wgMLST.</li>
<li><b>DEC 2016</b> - Addition of antimicrobial resistant genotypes/phenotypes to Pathogen Browser.</li>
<li><b>MAY 2016</b> - NCBI Pathogen Browser released.</li>
<li><b>DEC 2015</b> - Automated delivery of SNP trees to FTP from NCBI pipeline.</li>
<li><b>SPRING 2015</b> - White House initiative on Combating Antibiotic-Resistant Bacteria (CARB) includes building a national database of resistant pathogens; NCBI working on a system to identify resistance genes per isolate and a system to capture resistance phenotypes per isolate.</li>
<li><b>FALL 2014</b> - Automated delivery of NCBI analysis results, k-mer trees, work begins on detection of AMR genes/proteins.</li>
<li><b>SUMMER 2013</b> - Data starts to arrive at NCBI in summer of 2013.</li>
<li><b>JAN 2013</b> - NCBI begins modeling data systems/pipelines for Pathogen Detection.</li>
<li><b>MAR 2012</b> - NCBI begins integration of analysis pipeline into gpipe, k-mer analysis, assembly, SNP calling.</li>
<li><b>OCT 2011</b> - NCBI begins R&amp;D into a framework for analysis following the 2nd Global Microbial Identifier (GMI) meeting.</li>
<li><b>SEP 2011</b> - 1st Global Microbial Identifier (GMI) meeting: <a href="http://www.globalmicrobialidentifier.org/">http://www.globalmicrobialidentifier.org/</a>, <a href="http://science.sciencemag.org/content/333/6051/1818.full">http://science.sciencemag.org/content/333/6051/1818.full</a>.</li>
</ul>
<h3 id="change-log-organism-groups">Organism Group Changes <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" />
<a href="#change-log"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="Log of Changes to Pathogen Detection Project" /></a>
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a>
</h3>
<ul>
<li><b>2024-12-03</b> - Organism group <i>Candida auris</i> (PDG000000067) renamed to <i>Candidozyma auris</i>.</li>
<li><b>2024-10-11</b> - Organism group <i>Streptococcus mutans</i> (PDG000000140) introduced.</li>
<li><b>2024-10-10</b> - Organism group <i>Haemophilus influenzae</i> (PDG000000139) introduced.</li>
<li><b>2024-09-04</b> - The <i>Vibrio parahaemolyticus</i> organism group clustering method has been changed to use a wgMLST schema, starting with edition PDG000000023.956. Clustering results for the existing isolates have changed. In addition, non-<i>Vibrio parahaemolyticus</i> species formerly in this organism group were split to new organism groups:
<ul>
<li><i>Vibrio alginolyticus</i> (PDG000000136.1)</li>
<li><i>Vibrio antiquarius</i> (PDG000000137.1)</li>
<li><i>Vibrio diabolicus</i> (PDG000000138.1)</li>
</ul>
</li>
<li><b>2024-08-05</b> - Several <i>Neisseria</i> organism groups introduced:
<ul>
<li><i>Neisseria bacilliformis</i> (PDG000000129)</li>
<li><i>Neisseria cinerea</i> (PDG000000130)</li>
<li><i>Neisseria elongata</i> (PDG000000131)</li>
<li><i>Neisseria oralis</i> (PDG000000132)</li>
<li><i>Neisseria perflava</i> (PDG000000133)</li>
<li><i>Neisseria subflava</i> (PDG000000134)</li>
<li><i>Neisseria weaveri</i> (PDG000000135)</li>
</ul>
</li>
<li><b>2024-08-01</b> - The <i>Vibrio cholerae</i> organism group clustering threshold has been lowered, starting with edition PDG000000055.602. More than 350 new isolates have been included in clustering as a result. Clustering results for the existing isolates did not change, however. In addition, non-<i>Vibrio cholerae</i> species formerly in this organism group were split to new organism groups:
<ul>
<li><i>Vibrio mimicus</i> (PDG000000127)</li>
<li><i>Vibrio metoecus</i> (PDG000000128)</li>
</ul>
</li>
<li><b>2024-07-10</b> - Additional <i>Legionella</i> organism groups introduced:
<ul>
<li><i>Legionella anisa</i> (PDG000000123)</li>
<li><i>Legionella bozemanae</i> (PDG000000126)</li>
<li><i>Legionella cherrii</i> (PDG000000125)</li>
<li><i>Legionella feeleii</i> (PDG000000124)</li>
</ul>
</li>
<li><b>2024-07-03</b> - The <i>Legionella pneumophila</i> organism group clustering method has changed to use a wgMLST schema, starting with edition PDG000000026.306. There are significant changes to clusters and to the isolates in clusters; please review them if you are using specific clusters in this organism group.
</li>
<li><b>2024-01-18</b> - The <i>Enterococcus faecium</i> organism group (PDG000000071) has been split into its constituent species-specific organism groups as follows: <i>Enterococcus faecium</i> remains PDG000000071,
and <i>Enterococcus hirae</i> has been split to a new organism group (PDG000000122). In addition, the wgMLST locus found QC threshold has been lowered for <i>Enterococcus faecium</i>
thus admitting more isolates into the SNP clustering process.
</li>
<li><b>2023-03-14</b> - The <i>Enterobacter</i> organism group (PDG000000028) has been split into its constituent species-specific organism groups: <i>Enterobacter</i> has been renamed to <i>Enterobacter cloacae</i> (remains PDG000000028).
New organism groups have been created by splitting off the respective isolates as follows:
<ul>
<li><i>Enterobacter asburiae</i> (PDG000000106)</li>
<li><i>Enterobacter bugandensis</i> (PDG000000111)</li>
<li><i>Enterobacter cancerogenus</i> (PDG000000107)</li>
<li><i>Enterobacter chengduensis</i> (PDG000000118)</li>
<li><i>Enterobacter chuandaensis</i> (PDG000000119)</li>
<li><i>Enterobacter hormaechei</i> (PDG000000105)</li>
<li><i>Enterobacter kobei</i> (PDG000000108)</li>
<li><i>Enterobacter ludwigii</i> (PDG000000109)</li>
<li><i>Enterobacter mori</i> (PDG000000110)</li>
<li><i>Enterobacter oligotrophicus</i> (PDG000000121)</li>
<li><i>Enterobacter roggenkampii</i> (PDG000000116)</li>
<li><i>Enterobacter sichuanensis</i> (PDG000000117)</li>
<li><i>Enterobacter soli</i> (PDG000000112)</li>
<li><i>Kosakonia oryzendophytica</i> (PDG000000113)</li>
<li><i>Kosakonia oryziphila</i> (PDG000000114)</li>
<li><i>Phytobacter massiliensis</i> (PDG000000115)</li>
</ul>
</li>
<li><b>2023-02-08</b> - Organism group <i>Treponema pallidum</i> (PDG000000104) introduced.</li>
<li><b>2023-01-12</b> - Organism groups <i>Streptococcus equi</i> (PDG000000103), <i>Streptococcus suis</i> (PDG000000100), <i>Mannheimia haemolytica</i> (PDG000000101), and <i>Pasteurella multocida</i> (PDG000000102) introduced.</li>
<li><b>2023-01-05</b> - Organism groups <i>Vibrio metschnikovii</i> (PDG000000098) and <i>Vibrio fluvialis</i> (PDG000000099) introduced.</li>
<li><b>2022-11-21</b> - The <i>Neisseria</i> organism group (PDG000000032) has been split into its constituent species-specific organism groups: <i>Neisseria</i> has been renamed to <i>Neisseria gonorrhoeae</i> (remains PDG000000032).
New organism groups have been created by splitting off the respective isolates as follows: <i>Neisseria meningitidis</i> (PDG000000097), <i>Neisseria lactamica</i> (PDG000000095), <i>Neisseria polysaccharea</i> (PDG000000096).</li>
<li><b>2022-08-30</b> - Organism group <i>Burkholderia cepacia complex</i> (PDG000000094) introduced.</li>
<li><b>2022-07-08</b> - Organism groups <i>Pluralibacter gergoviae</i> (PDG000000092), <i>Stenotrophomonas maltophilia</i> (PDG000000093) introduced.</li>
<li><b>2022-06-01</b> - The <i>Listeria</i> organism group has been reorganized. All <i>Listeria monocytogenes</i> isolates continue to be clustered as before under <i>Listeria monocytogenes</i> (PDG000000001).
<i>Listeria innocua</i> isolates can now be found in a new organism group called <i>Listeria innocua</i> (PDG000000091).</li>
<li><b>2022-02-24</b> - Organism group <i>Streptococcus pyogenes</i> (PDG000000090) introduced.</li>
<li><b>2021-12-17</b> - Organism group <i>Streptococcus agalactiae</i> (PDG000000089) introduced.</li>
<li><b>2021-11-20</b> - Organism group <i>Bacillus cereus group</i> (PDG000000088) introduced.</li>
<li><b>2021-11-05</b> - Organism group <i>Yersinia enterocolitica</i> (PDG000000087) introduced.</li>
<li><b>2021-11-04</b> - New species <i>Aeromonas dhakensis</i> added to organism group <i>Aeromonas hydrophila</i> (PDG000000068).</li>
<li><b>2021-11-04</b> - Organism group <i>Yersinia ruckeri</i> (PDG000000086) introduced.</li>
<li><b>2021-11-04</b> - Organism groups <i>Aeromonas sobria</i> (PDG000000082), <i>Shewanella algae</i> (PDG000000084), <i>Streptococcus iniae</i> (PDG000000085), and <i>Vibrio harveyi</i> (PDG000000083) introduced.</li>
<li><b>2021-11-02</b> - Organism groups <i>Edwardsiella piscicida</i> (PDG000000080) and <i>Edwardsiella tarda</i> (PDG000000081) introduced.</li>
<li><b>2021-10-28</b> - Organism group <i>Edwardsiella ictaluri</i> (PDG000000079) introduced.</li>
<li><b>2021-10-27</b> - Organism group <i>Flavobacterium psychrophilum</i> introduced (PDG000000078)</li>
<li><b>2021-10-26</b> - Organism group <i>Aeromonas salmonicida</i> (PDG000000077) introduced.</li>
<li><b>2021-10-23</b> - Organism group <i>Aeromonas veronii</i> (PDG000000076) introduced.</li>
<li><b>2021-09-29</b> - Organism group <i>Pseudomonas putida</i> (PDG000000075) introduced.</li>
<li><b>2021-05-07</b> - Organism group <i>Streptococcus pneumoniae</i> (PDG000000074) introduced.</li>
<li><b>2021-04-13</b> - Organism group <i>Clostridium perfringens</i> (PDG000000061) expanded to include <i>Clostridium innocuum</i>.</li>
<li><b>2020-08-19</b> - Organism group <i>Staphylococcus aureus</i> (PDG000000073) introduced.</li>
<li><b>2020-03-06</b> - Organism groups <i>Enterococcus faecium</i> (PDG000000071) and <i>Enterococcus faecalis</i> (PDG000000072) introduced.</li>
<li><b>2019-11-24</b> - Organism group <i>Aeromonas hydrophila</i> (PDG000000068) introduced.</li>
<li><b>2019-09-17</b> - Organism group <i>Candida auris</i> (PDG000000067) introduced. This is the first fungal genome supported by Pathogen Detection.</li>
<li><b>2019-07-04</b> - Organism group <i>Pseudomonas aeruginosa</i> converted to wgMLST clustering starting with PDG000000036.199</li>
<li><b>2019-05-03</b> - Organism group <i>Klebsiella pneumoniae</i> converted to wgMLST clustering starting with PDG000000012.433</li>
<li><b>2019-02-13</b> - Organism group <i>Corynebacterium striatum</i> introduced (PDG000000064)</li>
<li><b>2019-01-31</b> - Organism group <i>Photobacterium damselae</i> introduced (PDG000000065)</li>
<li><b>2019-01-12</b> - Organism group <i>Vibrio vulnificus</i> introduced (PDG000000058)</li>
<li><b>2019-01-12</b> - Organism group <i>Clostridium botulinum</i> introduced (PDG000000059)</li>
<li><b>2019-01-09</b> - Organism group <i>Vibrio cholerae</i> (PDG000000055.1) introduced. This organism group uses wgMLST clustering.</li>
<li><b>2018-09-11</b> - Organism group <i>Clostridioides difficile</i> converted to wgMLST clustering starting with PDG000000045.44</li>
<li><b>2018-08-22</b> - Organism group <i>E. coli and Shigella</i> converted to wgMLST clustering starting with PDG000000004.987</li>
<li><b>2018-08-11</b> - Organism group <i>Salmonella enterica</i> converted to wgMLST clustering starting with PDG000000002.1173</li>
<li><b>2018-07-16</b> - Organism group <i>Listeria monocytogenes</i> converted to wgMLST clustering starting with PDG000000001.941</li>
<li><b>2018-06-12</b> - Organism group <i>Campylobacter jejuni</i> converted to wgMLST clustering starting with PDG000000003.579</li>
<li><b>2017-12-01</b> - Organism group <i>Clostridioides difficile</i> introduced (PDG000000045)</li>
<li><b>2017-11-17</b> - Organism group <i>Cronobacter</i> introduced (PDG000000043)</li>
<li><b>2017-07-29</b> - Organism group <i>Staphylococcus pseudintermedius</i> introduced (PDG000000042)</li>
<li><b>2017-01-14</b> - Organism group <i>Kluyvera intermedia</i> introduced (PDG000000040)</li>
<li><b>2017-01-14</b> - Organism group <i>Citrobacter freundii</i> (PDG000000039) introduced.</li>
<li><b>2017-01-04</b> - Organism group <i>Pseudomonas aeruginosa</i> introduced (PDG000000036)</li>
<li><b>2016-12-20</b> - Organism group <i>Mycobacterium tuberculosis</i> (PDG000000034) introduced.</li>
<li><b>2016-11-09</b> - Organism group <i>Klebsiella oxytoca</i> introduced (PDG000000030)</li>
<li><b>2016-08-23</b> - Organism group <i>Vibrio parahaemolyticus</i> introduced (PDG000000023)</li>
<li><b>2016-06-01</b> - Organism group <i>Providencia alcalifaciens</i> introduced (PDG000000021)</li>
<li><b>2016-06-01</b> - Organism group <i>Morganella morganii</i> (PDG000000020) introduced.</li>
<li><b>2016-03-23</b> - Organism group <i>Serratia marcescens</i> introduced (PDG000000016)</li>
<li><b>2016-03-20</b> - Organism group <i>Elizabethkingia anophelis</i> introduced (PDG000000014)</li>
<li><b>2016-03-03</b> - Organism group <i>Klebsiella pneumoniae</i> introduced (PDG000000012)</li>
<li><b>2016-03-08</b> - Organism group <i>Acinetobacter</i> (PDG000000010) introduced.</li>
<li><b>2015-01-09</b> - Initial food-borne organism groups introduced
<ul>
<li><i>Listeria</i> (PDG000000001)</li>
<li><i>Salmonella</i> (PDG000000002)</li>
<li><i>Campylobacter</i> (PDG000000003)</li>
<li><i>Escherichia coli / Shigella</i> (PDG000000004)</li>
</ul>
</li>
</ul>
<!-- ########## END_H2_SECTION:CHANGE_LOG ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:REFERENCES ########## -->
<h2 id="references">References <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<div style="padding-left: 2em">
<a href="#citing">Citing the Pathogen Detection Project</a><br />
<a href="#ncbi-references-methods">NCBI Publications/Methods used by the Pathogen Detection Project</a><br />
<a href="#third-party-references-methods">Third party Publications/Methods used by the Pathogen Detection Project</a><br />
<a href="#references-other">Publications from Other Sources using the Pathogen Detection Browser</a><br />
<a href="#references-external">Publications from External Labs using the Pathogen Detection Browser</a><br />
<a href="#references-presentations">Presentations about the Pathogen Detection Project</a><br />
<a href="#references-genomics-food-safety">References about the Genomics for Food Safety (GenFS) initiative</a><br />
<a href="#references-fda-genometrakr">References about the FDA GenomeTrakr project and WGS activities</a><br />
<a href="#references-cdc-pulsenet">References about the CDC PulseNet network and WGS activities</a><br />
<a href="#references-phe">References about Public Health England WGS activities</a><br />
<a href="#references-other">Other related references</a><br />
<a href="#references-amr">References on antimicrobial resistance</a>, including <a href="#AMRFinder_2019">AMRFinder</a>
</div>
<!-- ul>
<li><a href="#citing">Citing the NCBI Pathogen Detection Project</a></li>
<li><a href="#references-methods">Publications/Methods about the Pathogen Detection Project</a></li>
<li><a href="#references-external">Publications from External Labs using the Pathogen Detection Browser</a></li>
<li><a href="#references-presentations">Presentations about the Pathogen Detection Project</a></li>
<li><a href="#references-genomics-food-safety">References about the Genomics for Food Safety (GenFS) initiative</a></li>
<li><a href="#references-fda-genometrakr">References about the FDA GenomeTrakr project and WGS activities</a></li>
<li><a href="#references-cdc-pulsenet">References about the CDC PulseNet network and WGS activities</a></li>
<li><a href="#references-other">Other related references</a></li>
<li><a href="#references-amr">References on antimicrobial resistance</a></li>
</ul -->
<!-- ======== CITING ============ -->
<h3 id="citing">Citing the NCBI Pathogen Detection Project <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li id="PathogensWebsite_2016">The NCBI Pathogen Detection Project. National Center for Biotechnology Information, National Library of Medicine, National Institutes of Health, Bethesda, MD 20894, USA. 2016 May [cited YYYY MMM DD]. Available from: <a href="/pathogens/">https://www.ncbi.nlm.nih.gov/pathogens/</a></li>
</ul>
<!-- citation format for the website is based on Chapter 25 of Citing Medicine: The NLM Style Guide for Authors, Editors, and Publishers [Internet]. 2nd edition. https://www.ncbi.nlm.nih.gov/books/NBK7274/
TEMPLATE:
<a href="__________">Author AB. Title [Internet]. Bethesda (MD): National Library of Medicine (US), National Center for Biotechnology Information. 2016 May [updated YYYY MMM DD; cited YYYY MMM DD]. Available from: _____url_____.</a>
-->
<!-- ======== END_CITING ============ -->
<!-- ======== REFERENCES_METHODS ============ -->
<h3 id="ncbi-references-methods">NCBI Publications/Methods used by the Pathogen Detection Project <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>The SAUTE reference-guided assembler is used in the Pathogen Detection pipeline in conjunction with gene sequences from the AMRFinderPlus data release. Software is available at <a href="https://github.com/ncbi/skesa/releases">https://github.com/ncbi/skesa/releases</a></i>
<ul>
<li id="SAUTE_2021">Souvorov A and Agarwala R. SAUTE: sequence assembly using target enrichment. <b><i>BMC Bioinformatics.</i> 2021</b> Jul 21;22(1):375. doi: 10.1186/s12859-021-04174-9. <a href="https://www.ncbi.nlm.nih.gov/pubmed/34289805">PubMed PMID: 34289805</a>; <a href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-021-04174-9">Full text at BMC</a>.</li>
</ul>
<i>The SKESA assembler is used in the Pathogen Detection pipeline. Software is available at <a href="https://github.com/ncbi/SKESA">https://github.com/ncbi/SKESA</a></i>
<ul>
<li id="SKESA_2018">Souvorov A, Agarwala R, Lipman DJ. SKESA: strategic k-mer extension for scrupulous assemblies. <b><i>Genome Biol.</i> 2018</b> Oct 4;19(1):153. doi: 10.1186/s13059-018-1540-z. <a href="https://www.ncbi.nlm.nih.gov/pubmed/30286803">PubMed PMID: 30286803</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6172800/">Full text in PubMed Central PMCID: PMC6172800</a>; <a href="https://genomebiology.biomedcentral.com/articles/10.1186/s13059-018-1540-z">Full text at BMC</a>.</li>
</ul>
<i>The maximum compatibility algorithm is used to create the SNP trees in the Pathogen Detection browser. Software available at <a href="https://ftp.ncbi.nih.gov/pub/jcherry/compat/">https://ftp.ncbi.nih.gov/pub/jcherry/compat/</a></i>
<ul>
<li id="MaximumCompatibilityAlgorithm_2017">
Cherry JL. A practical exact maximum compatibility algorithm for
reconstruction of recent evolutionary history. <b><i>BMC Bioinformatics</i> 2017</b> Feb 23;18(1):127. doi: 10.1186/s12859-017-1520-4. <a href="https://www.ncbi.nlm.nih.gov/pubmed/28231758">PubMed PMID: 28231758</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5324209/">Full text in PubMed Central PMCID: PMC5324209</a>; <a href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-017-1520-4">Full text at BMC</a>.</li>
</ul>
<p id="amrfinder_citations"><i>The <b>AMRFinderPlus</b> software is used to identify antimicrobial resistance genes plus select virulence, biocide, metal, and stress resistance genes. Software is available at <a href="https://github.com/ncbi/amr/wiki">https://github.com/ncbi/amr/wiki</a></i></p>
<ul>
<li id="AMRFinder_2022a">Feldgarden M, Brover V, Fedorov B, Haft DH, Prasad AB, Klimke W. Curation of the AMRFinderPlus databases: applications, functionality and impact.
<b><i>Microb Genom.</i> 2022</b> Jun;8(6). doi: 10.1099/mgen.0.000832. <a href="https://pubmed.ncbi.nlm.nih.gov/35675101/">PubMed PMID: 35675101</a>; <a href="https://doi.org/10.1099/mgen.0.000832">Full text at Microbial Genomics</a>.</li>
<li id="AMRFinder_2021a">Feldgarden M, Brover V, Gonzalez-Escalona N, Frye JG, Haendiges J, Haft DH, Hoffmann M, Pettengill JB, Prasad AB, Tillman GE, Tyson GH, Klimke W. AMRFinderPlus and the Reference Gene Catalog facilitate examination of the genomic links among antimicrobial resistance, stress response, and virulence.
<b><i>Sci Rep.</i> 2021</b> Jun 16;11(1):12728. doi: 10.1038/s41598-021-91456-0. <a href="https://pubmed.ncbi.nlm.nih.gov/34135355/">PubMed PMID: 34135355</a>; <a href="https://www.nature.com/articles/s41598-021-91456-0">Full text at Nature Scientific Reports</a>.</li>
<li id="AMRFinder_2019a">
Feldgarden M, Brover V, Haft DH, Prasad AB, Slotta DJ, Tolstoy I, Tyson GH, Zhao S, Hsu C-H, McDermott PF, Tadesse DA, Morales C, Simmons M, Tillman G, Wasilenko J, Folster JP, Klimke W. Validating the NCBI AMRFinder Tool and Resistance Gene Database Using Antimicrobial Resistance Genotype-Phenotype Correlations in a Collection of NARMS Isolates. <b><i>Antimicrobial Agents and Chemotherapy. 2019</i></b> Nov 1;63(11). doi: 10.1128/AAC.00483-19. <a href="/pubmed/31427293">PubMed PMID: 31427293</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6811410/">Full text in PubMed Central PMCID: PMC6811410</a>; <a href="https://aac.asm.org/content/63/11/e00483-19">Full text at AAC</a>.</li>
</ul>
<i>The PGAP annotation pipeline is used to annotate bacterial assemblies. Software is available at: <a href="https://github.com/ncbi/pgap">https://github.com/ncbi/pgap</a></i>
<ul>
<li id="PGAP_2018">
Haft DH, DiCuccio M, Badretdin A, Brover V, Chetvernin V, O'Neill K, Li W, Chitsaz F, Derbyshire MK, Gonzales NR, Gwadz M, Lu F, Marchler GH, Song JS, Thanki N, Yamashita RA, Zheng C, Thibaud-Nissen F, Geer LY, Marchler-Bauer A, Pruitt KD. RefSeq: an update on prokaryotic genome annotation and curation. <b><i>Nucleic Acids Research. 2018 </i></b> Jan 4;46(D1):D851-D860. doi: 10.1093/nar/gkx1068 <a href="/pubmed/29112715">PubMed PMID: 29112715</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/pmid/29112715/">Full text in PubMed Central PMCID: PMC5753331</a>; <a href="https://academic.oup.com/nar/article-lookup/doi/10.1093/nar/gkx1068">Full text at Oxford University Press</a>.</li>
</ul>
</div>
<h3 id="third-party-references-methods">Third Party Publications/Methods used by the Pathogen Detection Project <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>SeqSero2 is run on Salmonella assemblies to populate the serotype and antigen_formula values in the computed_types field of the Pathogen Detection Isolates Browser.</i>
<ul>
<li id="seqsero2_2019">
Zhang S, den Bakker HC, Li S, Chen J, Dinsmore BA, Lane C, Lauer AC, Fields PI, Deng X. SeqSero2: Rapid and Improved Salmonella Serotype Determination Using Whole-Genome Sequencing Data. <b><i>Appl Environ Microbiol. 2019</i></b> Nov 14;85(23):e01746-19. <a href="https://doi.org/10.1128/AEM.01746-19">doi: 10.1128/AEM.01746-19</a>. <a href="/pubmed/31540993">PubMed PMID: 31540993</a>; <a href="/pmc/articles/PMC6856333/">Full text at PubMed Central PMCID: PMC6856333</a>.
</li>
<li id="seqsero2_2015">
Zhang S, Yin Y, Jones MB, Zhang Z, Deatherage Kaiser BL, Dinsmore BA, Fitzgerald C, Fields PI, Deng X. Salmonella serotype determination utilizing high-throughput genome sequencing data. <b><i>J Clin Microbiol. 2015</i></b> May;53(5):1685-92. <a href="https://doi.org/10.1128/JCM.00323-15">doi: 10.1128/JCM.00323-15</a>. Epub 2015 Mar 11. <a href="/pubmed/25762776">PubMed PMID: 25762776</a>; <a href="/pmc/articles/PMC4400759">Full text at PubMed Central PMCID: PMC4400759</a>.
</li>
</ul>
<i>HiSat2 is used to align reads to assemblies for coverage metrics.</i>
<ul>
<li id="hisat2_2019">
Kim D, Paggi JM, Park C, Bennett C, Salzberg SL. Graph-based genome alignment and genotyping with HISAT2 and HISAT-genotype. <b><i>Nat Biotechnol. 2019</i></b> Aug 2;37:907-915. <a href="https://doi.org/10.1038/s41587-019-0201-4">doi:10.1038/s41587-019-0201-4</a>; <a href="/pubmed/31375807/">PubMed PMID:31375807</a>; <a href="/pmc/articles/PMC7605509">Full text at PubMed Central PMCID: PMC7605509</a>.
</li>
</ul>
</div>
<!-- ======== END_REFERENCES_METHODS ============ -->
<!-- ======== REFERENCES_OTHER ============ -->
<h3 id="references-other">Publications from other sources using the Pathogen Detection Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>ProPublica Used Genomic Sequencing Data to Track an Ongoing Salmonella Outbreak.</i>
<ul>
<li id="PP_genomes">ProPublica (2021) Uses NCBI Pathogen Detection to look at Salmonella Infantis problem in food products. <a href="https://www.propublica.org/article/how-propublica-used-genomic-sequencing-data-to-track-an-ongoing-salmonella-outbreak">https://www.propublica.org/article/how-propublica-used-genomic-sequencing-data-to-track-an-ongoing-salmonella-outbreak</a> <a href="https://www.propublica.org/article/salmonella-chicken-usda-food-safety">https://www.propublica.org/article/salmonella-chicken-usda-food-safety</a></li>
</ul>
</div>
<!-- ======== END_REFERENCES_OTHER ============ -->
<!-- ======== REFERENCES_EXTERNAL ============ -->
<h3 id="references-external">Publications from External Labs using the Pathogen Detection Browser <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>Scientists use the Pathogen Detection System to link isolates from Southeast Asia to clinical cases in England and the US, some with a history of travel.</i>
<ul>
<li id="Cambodia_Corvallis">Schwan CL, Dallman TJ, Cook PW, Vipham J (2022) A case report of Salmonella enterica serovar Corvallis from environmental isolates from Cambodia and clinical isolates in the UK. Access Microbiology: Vol4(1) <a href="https://doi.org/10.1099/acmi.0.000315">https://doi.org/10.1099/acmi.0.000315</a></li>
</ul>
<i>Economic evaluation of whole genome sequence analysis using the publicly available data in the Pathogen Detection System.</i>
<ul>
<li id="FDA_econ_2021">Brown B, Allard M, Bazaco MC, Blankenship J, Minor T (2021) An economic evaluation of the Whole Genome Sequencing source tracking program in the U.S. PLoS ONE 16(10): e0258262. <a href="https://doi.org/10.1371/journal.pone.0258262">https://doi.org/10.1371/journal.pone.0258262</a></li>
</ul>
<i>Scientists in Oregon public health institutions use NCBI Pathogen Detection Browser to identify pathogenic Escherichia coli O157:H7 from venison from harvested deer and clinical cases from hunters in the same area. </i>
<ul>
<li id="OHA_E_coli_2021">Ladd-Wilson SG, Morey K, Turpen L, DeMarco K, Van Der Veen G, Fontana JL, Dannenhoffer RL, Tenney K, Kutumbaka KK, Samadpour M, Cieslak PR. Escherichia coli O157:H7 Cluster Associated With Deer Harvested at a Single Wildlife Hunting Area, Oregon, 2017. <a href="https://doi.org/10.1177%2F00333549211046111">Full text at Public Health Reports</a>.</li>
</ul>
<i>Scientists at multiple institutions use NCBI Pathogen Detection Browser for evaluation of Shigella isolates. The analysis evaluates macrolide resistance and plasmid structure, and identifies multiple outbreaks in the United States as well as evidence of intercontinental transmission.</i>
<ul>
<li id="Wadsworth_shigella_2021">Worley JN, Javkar K, Hoffmann M, Hysell K, Garcia-Williams A, Tagg K, Kanjilal S, Strain E, Pop M, Allard M, Francois Watkins L, Bry L. Genomic Drivers of Multidrug-Resistant Shigella Affecting Vulnerable Patient Populations in the United States and Abroad. <a href="https://www.ncbi.nlm.nih.gov/pubmed/33500335">PubMed PMID: 33500335</a>; <a href="https://mbio.asm.org/content/12/1/e03188-20">Full text at mBio</a>.</li>
</ul>
<i>Scientists at New York State Department of Health use NCBI Pathogen Detection Browser for retrospective analysis of Clostridium perfringens outbreaks</i>
<ul>
<li id="NY_Cper">Carey J, Cole J, Venkata SLG, Hoyt H, Mingle L, Nicholas D, Musser KA, Wolfgang WJ. Genomic Epidemiology of Historical Clostridium perfringens Outbreaks in New York State Using Two Web-based Platforms: National Center for Biotechnology Information-Pathogen Detection and FDA-GalaxyTrakr. <a href="https://www.ncbi.nlm.nih.gov/pubmed/33177125">PubMed PMID: 33177125</a>; <a href="https://jcm.asm.org/content/early/2020/11/05/JCM.02200-20">Full text at Journal of Clinical Microbiology</a>.</li>
</ul>
<i>Scientists at multiple public health agencies use NCBI Pathogen Detection Browser for international Listeria outbreak</i>
<ul>
<li id="FDA_enoki">Pettengill J, Markell A, Conrad A, Carleton H, Beal J, Rand H, Musser S, Brown E, Allard M, Huffman J, Harris S, Wise M, Locas A. A multinational listeriosis outbreak and the importance of sharing genomic data. <a href="https://doi.org/10.1016/S2666-5247(20)30122-1">Full text at The Lancet</a>.</li>
</ul>
<i>Scientists at BWH use NCBI Pathogen Detection Browser to examine C. difficile transmission</i>
<ul>
<li id="BWH_CD_2020">Worley J, Delaney ML, Cummins CK, DuBois A, Klompas M, Bry L. Genomic determination of relative risks for Clostridioides difficile infection from asymptomatic carriage in ICU patients. <a href="https://www.ncbi.nlm.nih.gov/pubmed/32676661">PubMed PMID: 32676661</a>; <a href="https://doi.org/10.1093/cid/ciaa894">Full text at Clin Infect Dis</a>.</li>
</ul>
<i>Oregon Health Authority uses NCBI Pathogen Detection Browser to Uncover Outbreak</i>
<ul>
<li id="OHA_2018">Ladd-Wilson SG, Morey K, Koske SE, Burkhalter B, Bottichio L, Brandenburg J, Fontana J, Tenney K, Kutumbaka KK, Samadpour M, Kreil K, Cieslak PR. Notes from the Field: Multistate Outbreak of Salmonella Agbeni Associated with Consumption of Raw Cake Mix - Five States, 2018. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31465317">PubMed PMID: 31465317</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6715262/">Full text in PubMed Central PMCID: PMC6715262</a>; <a href="https://dx.doi.org/10.15585/mmwr.mm6834a5">Full text at MMWR</a>.</li>
</ul>
<i>Israeli Ministry of Health uses Pathogen Detection Browser and AMRFinder Results to Examine Multi-Drug Resistant Shigella spp.</i>
<ul>
<li id="Shigella_2019">Ezernitchi AV, Sirotkin E, Danino D, Agmon V, Valinsky L, Rokney A. Azithromycin non-susceptible Shigella circulating in Israel, 2014-2016. <b><i>PLoS One.</i> 2019</b> Oct 18;14(10):e0221458. doi: 10.1371/journal.pone.0221458. eCollection 2019. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31626667">PubMed PMID: 31626667</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6799884/">Full text in PubMed Central PMCID: PMC6799884</a>; <a href="https://doi.org/10.1371/journal.pone.0221458">Full text at PLoS ONE</a>.</li>
</ul>
<i>Scientists at University of Pretoria, South Africa, use antimicrobial resistance data from the NCBI Pathogen Detection Browser to examine the genomic epidemiology of African Gram-negative bacteria</i>
<ul>
<li id="SA_genepi">Sekyere JO, and Reta MA. Genomic and Resistance Epidemiology of Gram-Negative Bacteria in Africa: a Systematic Review and Phylogenomic Analyses from a One Health Perspective. <a href="https://pubmed.ncbi.nlm.nih.gov/33234606/">PubMed PMID: 33234606</a>; <a href="https://msystems.asm.org/content/5/6/e00897-20">Full text at mSystems</a>.</li>
</ul>
<i>Department of Civil Engineering, Hawaii, Uses Pathogen Browser for Analysis of Municipal Wastewater Salmonella Isolates</i>
<ul>
<li id="Water_2019">Diemert S, Yan T. Clinically Unreported Salmonellosis Outbreak Detected via Comparative Genomic Analysis of Municipal Wastewater Salmonella Isolates. <b><i>Appl Environ Microbiol.</i> 2019</b> May 2;85(10). pii: e00139-19. doi: 10.1128/AEM.00139-19. Print 2019 May 15. <a href="https://www.ncbi.nlm.nih.gov/pubmed/30902850">PubMed PMID: 30902850</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6498150/">Full text in PubMed Central PMCID: PMC6498150</a>; <a href="https://doi.org/10.1128/AEM.00139-19">Full text at Applied and Environmental Microbiology</a>.</li>
</ul>
</div>
<!-- ======== END_REFERENCES_EXTERNAL ============ -->
<!-- ======== PRESENTATIONS ============ -->
<h3 id="references-presentations">Presentations about the Pathogen Detection Project <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>2018:</i>
<ul>
<li id="NCBIWebinar_20180321">NCBI Webinar: "<b>Introducing the NCBI Pathogen Detection Isolates Browser</b>," March 21, 2018 (<a href="https://ncbiinsights.ncbi.nlm.nih.gov/2018/03/14/march-21-webinar-ncbi-pathogen-detection-isolates-browser/">webinar announcement/description</a>; <a href="https://youtu.be/T8HluuzOb5c">recording of webinar</a> (31:23 minutes); <a href="https://ftp.ncbi.nlm.nih.gov/pub/education/public_webinars/2018/03Mar21_Pathogen_Browser/">slides and questions/answers</a>)</li>
</ul>
<i>2019:</i>
<ul>
<li id="ASM_Microbe_2019"><a href="https://www.asm.org/"><b>American Society for Microbiology</b></a><a href="https://www.asm.org/Events/ASM-Microbe/Home"><b> Microbe Conference</b></a><a href="https://www.abstractsonline.com/pp8/#!/7859"> in San Francisco, CA, June 20-24, 2019</a>.<br />
The following presentations by the NCBI Pathogen Detection Project Group and the NCBI Taxonomy Group are available on the NCBI FTP site: <a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2019_Talks_Posters/">https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2019_Talks_Posters/</a>:</li>
</ul>
<ul>
<li id="ASM_Microbe_2019_ncbi_amr_resources"><a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2019_Talks_Posters/ASM2019_Talk_AMR_Resource.pdf">AMR Resources at NCBI's Pathogen Portal</a></li>
<li id="ASM_Microbe_2019_amr_genes_from_whole_genomes"><a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2019_Talks_Posters/ASM2019_Talk_AMR_from_Genomes.pdf">Antibiotic Resistance Genes from Whole Genome Sequences</a></li>
</ul>
<i>2022:</i>
<ul>
<li id="ASM_Microbe_2022"> <a href="https://www.asm.org/Events/ASM-Microbe/Home"><b>ASM Microbe Conference</b></a> in Washington, DC, June 20-24, 2022</li>
</ul>
<ul>
<li id="ASM_Microbe_2022_Elizabeth_King_Lecture"><a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2022/ASM2022_E.O.King_Award_Talk.pptx">ASM Elizabeth King Lecturer Award Talk</a></li>
<li id="ASM_Microbe_2022_PD_Presentation"><a href="https://ftp.ncbi.nlm.nih.gov/pub/factsheets/ASM2022/NCBI_Pathogen_ASM_2022.pptx">ASM Pathogen 2022 Presentation</a></li>
</ul>
<ul>
<li id="ASM_NGS_2022"> <a href="https://asm.org/Events/ASM-NGS/Home"><b>American Society for Microbiology NGS 2022</b></a> in Baltimore, MD, Oct 16-19, 2022</li>
</ul>
<ul>
<li>PD team participated in a <a href="https://github.com/ncbi/workshop-asm-ngs-2022/wiki">workshop</a> at ASM NGS 2022 which included some projects that demonstrate how to use our resources in the cloud.</li>
</ul>
<i>2023:</i>
<ul>
<li id="Webinar_2023"><a href="https://youtu.be/j4dzFOo2FmI">Introduction to NCBI Pathogen Detection and antimicrobial resistance data in Google BigQuery</a></li>
</ul>
</div>
<!-- ======== END_PRESENTATIONS ============ -->
<!-- ======== REFERENCES_GENOMICS_FOOD_SAFETY ============ -->
<h3 id="references-genomics-food-safety">References about the Genomics for Food Safety (GenFS) initiative <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>The Genomics for Food Safety Interagency Collaboration (CDC, FDA, USDA-FSIS, and NCBI-NLM-NIH) is described including Pathogen Detection.</i>
<ul>
<li id="GenFS2022">Stevens EL, Carleton HA, Beal J, Tillman GE, Lindsey RL, Lauer AC, Pightling A, Jarvis KG, Ottesen A, Ramachandran P, Hintz L, Katz LS, Folster JP, Whichard JM, Trees E, Timme RE, McDermott P, Wolpert B, Bazaco M, Zhao S, Lindley S, Bruce BB, Griffin PM, Brown E, Allard M, Tallent S, Irvin K, Hoffmann M, Wise M, Tauxe R, Gerner-Smidt P, Simmons M, Kissler B, Defibaugh-Chavez S, Klimke W, Agarwala R, Lindsay J, Cook K, Austerman SR, Goldman D, McGarry S, Hale KR, Dessai U, Musser SM, Braden C. Use of Whole Genome Sequencing by the Federal Interagency Collaboration for Genomics for Food and Feed Safety in the United States. <b><i>J Food Prot.</i> 2022</b> May 1;85(5):755-772. doi: 10.4315/JFP-21-437. <a href="https://www.ncbi.nlm.nih.gov/pubmed/35259246">PubMed PMID: 35259246</a>; <a href="https://doi.org/10.4315/JFP-21-437">Full text at Journal of Food Protection</a>.</li>
</ul>
<i>A publication describing datasets for phylogenetic validation based on WGS of four foodborne pathogens from the data standards working group:</i>
<ul>
<li id="BenchmarkDatasets_2017">Timme RE, Rand H, Shumway M, Trees EK, Simmons M, Agarwala R, Davis S, Tillman GE, Defibaugh-Chavez S, Carleton HA, Klimke WA, Katz LS. Benchmark datasets for phylogenomic pipeline validation, applications for foodborne pathogen surveillance. <b><i>PeerJ</i> 2017</b> Oct 6;5:e3893. doi: 10.7717/peerj.3893. eCollection 2017. <a href="https://www.ncbi.nlm.nih.gov/pubmed/29372115">PubMed PMID: 29372115</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5782805/">Full text in PubMed Central PMCID: PMC5782805</a>; <a href="https://peerj.com/articles/3893/">Full text at PeerJ</a>.</li>
</ul>
</div>
<!-- ======== END_REFERENCES_GENOMICS_FOOD_SAFETY ============ -->
<!-- ======== REFERENCES_FDA_GENOMETRAKR ============ -->
<h3 id="references-fda-genometrakr">References about the FDA GenomeTrakr project and WGS activities <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>FDA Podcast on Food Safety and WGS:</i>
<ul>
<li id="FDA_podcast">New Era of Smarter Food Safety TechTalk Podcast. <a href="https://www.fda.gov/food/new-era-smarter-food-safety-techtalk-podcast/techtalk-podcast-episode-2-whole-genome-sequencing-new-era-smarter-food-safety">TechTalk Podcast Episode 2: Whole Genome Sequencing in the New Era of Smarter Food Safety. </a><a href="https://www.fda.gov/media/151392/download">MP3 link.</a></li>
</ul>
<i>FDA 2021 Focus on Regulatory Science:</i>
<ul>
<li id="FDA_2021_focus">FDA Publishes Report on Focus Areas of Regulatory Science. <a href="https://www.fda.gov/media/145001/download">PDF Version.</a></li>
</ul>
<i>GenomeTrakr proficiency testing:</i>
<ul>
<li id="GenomeTrakr_2018">Timme RE, Rand H, Sanchez Leon M, Hoffmann M, Strain E, Allard M, Roberson D, Baugher JD. GenomeTrakr proficiency testing for foodborne pathogen surveillance: an exercise from 2015. <b><i>Microb Genom.</i> 2018</b> Jul;4(7). doi: 10.1099/mgen.0.000185. Epub 2018 Jun 15. <a href="https://www.ncbi.nlm.nih.gov/pubmed/29906258">PubMed PMID: 29906258</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6113870/">Full text in PubMed Central PMCID: PMC6113870</a>; <a href="http://mgen.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000185#tab2">Full text at Microbiology Society</a></li>
</ul>
<!-- Duplicate "GenomeTrakr proficiency testing" entry removed: it repeated the preceding list item verbatim, including its id="GenomeTrakr_2018". -->
<i>Demonstration of the value of WGS and data sharing:</i>
<ul>
<li id="GenomeTrakr_WGS_2016">Allard MW, Strain E, Melka D, Bunning K, Musser SM, Brown EW, Timme R. Practical Value of Food Pathogen Traceability through Building a Whole-Genome Sequencing Network and Database. <b><i>J Clin Microbiol.</i> 2016</b> Aug;54(8):1975-83. doi: 10.1128/JCM.00081-16. Epub 2016 Mar 23. Review. <a href="https://www.ncbi.nlm.nih.gov/pubmed/27008877">PubMed PMID: 27008877</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4963501/">Full text in PubMed Central PMCID: PMC4963501</a>; <a href="https://jcm.asm.org/content/54/8/1975.long">Full text at American Society for Microbiology</a></li>
</ul>
<i>FDA uses Isolates Browser for Listeria ice cream outbreak analysis</i>
<ul>
<li id="GenomeTrakr_icecream">Allard MW, Strain E, Rand H, Melka D, Correll WA, Hintz L, Stevens E, Timme R, Lomonaco S, Chen Y, Musser SM, Brown EW. Whole genome sequencing uses for foodborne contamination and compliance: Discovery of an emerging contamination event in an ice cream facility using whole genome sequencing. <b><i>Infect Genet Evol.</i> 2019</b> Sep;73:214-220. doi: 10.1016/j.meegid.2019.04.026. Epub 2019 Apr 27. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31039448">PubMed PMID: 31039448</a>; <a href="https://doi.org/10.1016/j.meegid.2019.04.026">Full text at Infection, Genetics and Evolution</a></li>
</ul>
<i>FDA uses Isolates Browser for Salmonella enterica Analyses</i>
<ul>
<li id="GenomeTrakr_sefeed">Trinetta V, Magossi G, Allard MW, Tallent SM, Brown EW, Lomonaco S. Characterization of Salmonella enterica Isolates From Selected U.S. Swine Feed Mills by Whole-Genome Sequencing. <b><i>Foodborne Pathog Dis.</i> 2020</b> Feb;17(2):126-136. doi: 10.1089/fpd.2019.2701. Epub 2019 Nov 8. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31702400">PubMed PMID: 31702400</a>; <a href="https://doi.org/10.1089/fpd.2019.2701">Full text at Foodborne Pathog Dis.</a></li>
</ul>
<i>FDA Discusses Open Data and Interoperability with Pathogen Detection as a Model</i>
<ul>
<li id="GenomeTrakr_opendata"> Timme RE, Wolfgang WJ, Balkey M, Venkata SLG, Randolph R, Allard M, Strain E. Optimizing open data to support one health: best practices to ensure interoperability of genomic data from bacterial pathogens. <b><i>One Health Outlook.</i> 2020</b> Epub 2020 Oct 19. doi: 10.1186/s42522-020-00026-3. <a href="https://www.ncbi.nlm.nih.gov/pubmed/33103064">PubMed PMID: 33103064</a>; <a href="https://onehealthoutlook.biomedcentral.com/articles/10.1186/s42522-020-00026-3">Full text at One Health Outlook.</a></li>
</ul>
<i><a href="https://www.protocols.io/workspaces/genometrakr1/publications">FDA GenomeTrakr Protocols IO</a></i>
<ul>
<li id="FDA_GT_protocols_NCBIsub"><a href="https://www.protocols.io/view/ncbi-submission-protocol-for-microbial-pathogen-su-bf3xjqpn">NCBI submission protocol for microbial pathogen surveillance V.3</a></li>
<li id="FDA_GT_protocols_NCBImetadata"><a href="https://www.protocols.io/view/populating-the-ncbi-pathogen-metadata-template-be9gjh3w">Populating the NCBI pathogen metadata template V.3</a></li>
<li id="FDA_GT_protocols_NCBIdatacuration"><a href="https://www.protocols.io/view/ncbi-data-curation-protocol-bacaiase">NCBI data curation protocol</a></li>
<li id="FDA_GT_protocols_seqquality"><a href="https://www.protocols.io/view/assessing-sequence-quality-in-galaxytrakr-bdvfi63n">Assessing sequence quality in GalaxyTrakr V.2</a></li>
</ul>
</div>
<!-- ======== END_REFERENCES_FDA_GENOMETRAKR ============ -->
<!-- ======== REFERENCES_CDC_PULSENET ============ -->
<h3 id="references-cdc-pulsenet">References about the CDC PulseNet network and WGS activities <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>Pathogen Genomics in Public Health - Cites NCBI Pathogen Detection Isolates Browser as a Model for Open Information</i>
<ul>
<li id="Armstrong_2019">Armstrong GL, MacCannell DR, Taylor J, Carleton HA, Neuhaus EB, Bradbury RS, Posey JE, Gwinn M. Pathogen Genomics in Public Health. <b><i>N Engl J Med.</i> 2019</b> Dec 26;381(26):2569-2580. doi: 10.1056/NEJMsr1813907. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31881145">PubMed PMID: 31881145</a>; <a href="https://doi.org/10.1056/NEJMsr1813907">Full text at New England Journal of Medicine</a></li>
</ul>
<i>PulseNet vision statement:</i>
<ul>
<li id="PulseNetVisionStatement_2017">Nadon C, Van Walle I, Gerner-Smidt P, Campos J, Chinen I, Concepcion-Acevedo J, Gilpin B, Smith AM, Man Kam K, Perez E, Trees E, Kubota K, Takkinen J, Nielsen EM, Carleton H; FWD-NEXT Expert Panel. PulseNet International: Vision for the implementation of whole genome sequencing (WGS) for global food-borne disease surveillance. <b><i>Euro Surveill.</i> 2017</b> Jun 8;22(23). pii: 30544. doi: 10.2807/1560-7917.ES.2017.22.23.30544. Review. <a href="https://www.ncbi.nlm.nih.gov/pubmed/28662764">PubMed PMID: 28662764</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5479977/">Full text in PubMed Central PMCID: PMC5479977</a>; <a href="https://www.eurosurveillance.org/content/10.2807/1560-7917.ES.2017.22.23.30544">Full text at Eurosurveillance</a></li>
</ul>
<i>PulseNet 20th anniversary announcement:</i>
<ul>
<li id="PulseNet20thAnniversary_2016">Announcement: 20th Anniversary of PulseNet: the National Molecular Subtyping
Network for Foodborne Disease Surveillance - United States, 2016. <b><i>MMWR Morb Mortal Wkly Rep.</i> 2016</b> Jun 24;65(24):636. doi: 10.15585/mmwr.mm6524a5. <a href="https://www.ncbi.nlm.nih.gov/pubmed/27337605">PubMed PMID: 27337605</a>; <a href="https://www.cdc.gov/mmwr/volumes/65/wr/mm6524a5.htm">Full text at CDC</a></li>
</ul>
<i>Showing that the switch to WGS results in decreased cluster sizes and more outbreaks solved:</i>
<ul>
<li id="ListeriosisOutbreakDetection_2016">Jackson BR, Tarr C, Strain E, Jackson KA, Conrad A, Carleton H, Katz LS, Stroika S, Gould LH, Mody RK, Silk BJ, Beal J, Chen Y, Timme R, Doyle M, Fields A, Wise M, Tillman G, Defibaugh-Chavez S, Kucerova Z, Sabol A, Roache K, Trees E, Simmons M, Wasilenko J, Kubota K, Pouseele H, Klimke W, Besser J, Brown E, Allard M, Gerner-Smidt P. Implementation of Nationwide Real-time Whole-genome Sequencing to Enhance Listeriosis Outbreak Detection and Investigation. <b><i>Clin Infect Dis.</i> 2016</b> Aug 1;63(3):380-6. doi: 10.1093/cid/ciw242. Epub 2016 Apr 18. <a href="https://www.ncbi.nlm.nih.gov/pubmed/27090985">PubMed PMID: 27090985</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4946012/">Full text in PubMed Central PMCID: PMC4946012</a>; <a href="https://academic.oup.com/cid/article/63/3/380/2595027">Full text at Oxford Academic</a>.</li>
</ul>
</div>
<!-- ======== END_REFERENCES_CDC_PULSENET ============ -->
<!-- ======== REFERENCES_PHE ============ -->
<h3 id="references-phe">References about Public Health England WGS activities <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>Public Health England Describes Switch to Whole Genome Sequencing for Pathogen Surveillance for Salmonella - Cites NCBI Pathogen Detection as a Model for Open Information</i>
<ul>
<li id="PHE_2019">Chattaway MA, Dallman TJ, Larkin L, Nair S, McCormick J, Mikhail A, Hartman H, Godbole G, Powell D, Day M, Smith R, Grant K. The Transformation of Reference Microbiology Methods and Surveillance for Salmonella With the Use of Whole Genome Sequencing in England and Wales. <b><i>Front Public Health.</i> 2019</b> Nov 21;7:317. doi: 10.3389/fpubh.2019.00317. eCollection 2019. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31824904">PubMed PMID: 31824904</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6881236/">Full text in PubMed Central PMCID: PMC6881236</a>; <a href="https://doi.org/10.3389/fpubh.2019.00317">Full text at Frontiers in Public Health</a>.</li>
</ul>
</div>
<!-- ======== END_REFERENCES_PHE ============ -->
<!-- ======== OTHER_RELATED_REFERENCES ============ -->
<h3 id="references-other-related">Other related references <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<ul>
<li id="GMI_Initiative_2011"><b>Global Microbial Identifier (GMI) initiative</b>:<br />
Kupferschmidt K. Epidemiology. Outbreak detectives embrace the genome era.
<i>Science</i>. 2011 Sep 30;333(6051):1818-9. doi: 10.1126/science.333.6051.1818. <a href="https://www.ncbi.nlm.nih.gov/pubmed/21960605">PubMed PMID: 21960605</a>; <a href="http://science.sciencemag.org/content/333/6051/1818.long">Full text at Science Magazine</a><br />
<a href="http://www.globalmicrobialidentifier.org/">GMI website: http://www.globalmicrobialidentifier.org/</a>
<div style="padding-left: 2em">
<i>Note: The Global Microbial Identifier (GMI) initiative is a grassroots attempt to build a global system of DNA genome databases for microbial and infectious disease identification and diagnostics. Sequencing projects that are flagged with the 'GMI' keyword can be found in the NCBI BioProject database via this search: <a href="https://www.ncbi.nlm.nih.gov/bioproject/?term=GMI[keyword]">https://www.ncbi.nlm.nih.gov/bioproject/?term=GMI[keyword]</a></i>
</div>
</li>
<li id="FDA-ARGOS_2019"><b>FDA-ARGOS</b>:<br />
Sichtig H, Minogue T, Yan Y, Stefan C, Hall A, Tallon L, Sadzewicz L, Nadendla S, Klimke W, Hatcher E, Shumway M, Aldea DL, Allen J, Koehler J, Slezak T, Lovell S, Schoepp R, Scherf U. FDA-ARGOS is a database with public quality-controlled reference genomes for diagnostic use and regulatory science.
<i>Nat Commun.</i> 2019 Jul 25;10(1):3313. doi: 10.1038/s41467-019-11306-6. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31346170">PubMed PMID: 31346170</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6658474/">Full text in PubMed Central PMCID: PMC6658474</a>; <a href="https://www.nature.com/articles/s41467-019-11306-6">Full text at Nature Publishing Group</a></li>
</ul>
<!-- ======== END_OTHER_RELATED_REFERENCES ============ -->
<!-- ======== REFERENCES_ANTIMICROBIAL_RESISTANCE ============ -->
<h3 id="references-amr">References on antimicrobial resistance <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3>
<div style="padding-left: 2em">
<i>Using the NCBI AMRFinderPlus Tool:</i>
<ul>
<li id="AMRFinder_2022">Feldgarden M, Brover V, Fedorov B, Haft DH, Prasad AB, Klimke W. Curation of the AMRFinderPlus databases: applications, functionality and impact.
<b><i>Microb Genom.</i> 2022</b> Jun;8(6). doi: 10.1099/mgen.0.000832. <a href="https://pubmed.ncbi.nlm.nih.gov/35675101/">PubMed PMID: 35675101</a>; <a href="https://doi.org/10.1099/mgen.0.000832">Full text at Microbial Genomics</a>.</li>
<li id="AMRFinder_2021">Feldgarden M, Brover V, Gonzalez-Escalona N, Frye JG, Haendiges J, Haft DH, Hoffmann M, Pettengill JB, Prasad AB, Tillman GE, Tyson GH, Klimke W. AMRFinderPlus and the Reference Gene Catalog facilitate examination of the genomic links among antimicrobial resistance, stress response, and virulence.
<b><i>Sci Rep.</i> 2021</b> June 16;11(1):12728. https://doi.org/10.1038/s41598-021-91456-0. <a href="https://pubmed.ncbi.nlm.nih.gov/34135355/">PubMed PMID: 34135355</a>; <a href="https://www.nature.com/articles/s41598-021-91456-0">Full text at Nature Scientific Reports</a>.</li>
<li id="AMRFinder_2019">Feldgarden M, Brover V, Haft DH, Prasad AB, Slotta DJ, Tolstoy I, Tyson GH, Zhao S, Hsu CH, McDermott PF, Tadesse DA, Morales C, Simmons M, Tillman G, Wasilenko J, Folster JP, Klimke W. Validating the NCBI AMRFinder Tool and Resistance Gene Database Using Antimicrobial Resistance Genotype-Phenotype Correlations in a Collection of NARMS Isolates.
<b><i>Antimicrob Agents Chemother</i> 2019</b> Aug 19. pii: AAC.00483-19. doi: 10.1128/AAC.00483-19. [Epub ahead of print] <a href="https://www.ncbi.nlm.nih.gov/pubmed/31427293">PubMed PMID: 31427293</a>; <a href="https://aac.asm.org/content/early/2019/08/27/AAC.00483-19.long">Full text at AAC</a>.</li>
<!-- li id="AMRFinder_2019">Feldgarden M, Brover V, Haft DH, Prasad AB, Slotta DJ, Tolstoy I, Tyson GH, Zhao S, Hsu CH, McDermott PF, Tadesse DA, Morales C, Simmons M, Tillman G, Wasilenko J, Folster JP, Klimke W.
Using the NCBI AMRFinder Tool to Determine Antimicrobial Resistance Genotype-Phenotype Correlations Within a Collection of NARMS Isolates.
<b><i>bioRxiv</i> 2019</b> doi: 10.1101/550707. <a href="https://www.biorxiv.org/content/10.1101/550707v1">Full text on bioRxiv Preprint Server</a>[bioRxiv 550707; doi: https://doi.org/10.1101/550707]</li -->
</ul>
<i>AMRFinderPlus used to confirm putative virally-encoded beta-lactamases</i>
<ul>
<li id="viral_beta_lactamase_AMRFinderPlus">Nayfach S., <i>et al</i>. Metagenomic compendium of 189,680 DNA viruses from the human gut microbiome. <b><i>Nat Microbiol.</i> 2021</b> June https://doi.org/10.1038/s41564-021-00928-6. <a href="https://doi.org/10.1038/s41564-021-00928-6">Full text at Nature Microbiology</a>; <a href="https://pubmed.ncbi.nlm.nih.gov/34168315/">PubMed PMID: 34168315</a>.</li>
</ul>
<i>AMRFinderPlus implemented in SeqSphere<sup>+</sup></i>
<ul>
<li id="SeqSphere_AMRFinderPlus">Papan C., <i>et al</i>. Combined antibiotic stewardship and infection control measures to contain the spread of linezolid-resistant Staphylococcus epidermidis in an intensive care unit. <b><i>Antimicrob Resist Infect Control.</i> 2021</b> June https://doi.org/10.1186/s13756-021-00970-3. <a href="https://doi.org/10.1186/s13756-021-00970-3">Full text at Antimicrob Resist Infect Control</a>; <a href="https://pubmed.ncbi.nlm.nih.gov/34193293/">PubMed PMID: 34193293</a>.</li>
</ul>
<i>Using AMRFinderPlus to identify metal resistance genes</i>
<ul>
<li id="Ent_metalresistance_AMRFinderPlus">Wee S.K., <i>et al</i>. Draft Genome Sequence of <i>Enterobacter hormaechei</i> subsp. <i>steigerwaltii</i> Strain BEI01. <b><i>Microbiol Resour Announc.</i> 2021</b> July https://doi.org/10.1128/mra.00406-21. <a href="https://doi.org/10.1128/mra.00406-21">Full text at Microbiol Resour Announc</a>; <a href="https://pubmed.ncbi.nlm.nih.gov/34264109/">PubMed PMID: 34264109</a>.</li>
</ul>
<i>Uses AMRFinderPlus and MicroBIGG-E output to identify health risks of antibiotic resistance genes</i>
<ul>
<li id="OMICS_AMRFinderPlus">Zhang A-N, <i>et al</i>. An omics-based framework for assessing the health risk of antimicrobial resistance genes. <b><i>Nature Communications</i> 2021</b> August https://doi.org/10.1038/s41467-021-25096-3. <a href="https://doi.org/10.1038/s41467-021-25096-3">Full text at Nature Communications</a>; <a href="https://pubmed.ncbi.nlm.nih.gov/34362925/">PubMed PMID: 34362925</a>.</li>
</ul>
<i>NIAID Funded Bioinformatics Resource Center PATRIC uses AMRFinderPlus</i>
<ul>
<li id="NIAID_PATRIC_AMRFinderPlus">Davis JJ, <i>et al</i>. The PATRIC Bioinformatics Resource Center: expanding data and analysis capabilities. <b><i>NAR</i> 2020</b> January https://doi.org/10.1093/nar/gkz943. <a href="https://doi.org/10.1093/nar/gkz943">Full text at Nucleic Acids Research</a>; <a href="https://www.ncbi.nlm.nih.gov/pubmed/31667520">PubMed PMID: 31667520</a>.</li>
</ul>
<i>Veterinary Laboratory Information and Response Network of FDA Identifies NDM-5 in E. coli from Companion Animals Using Isolates Browser and AMRFinderPlus Results</i>
<ul>
<li id="CVM_ecoli_ndm5">Cole SD, Peak L, Tyson GH, Reimschuessel R, Ceric O, Rankin SC. New Delhi Metallo-beta-Lactamase-5-producing Escherichia coli in Companion Animals, United States. <b><i>Emerg Infect Dis.</i> 2020</b> Feb https://doi.org/10.3201/eid2602.191221. <a href="https://doi.org/10.3201/eid2602.191221">Full text at Emerging Infectious Diseases</a>.</li>
</ul>
<i>FDA Center for Veterinary Medicine uses Pathogen Browser and AMRFinder Results to Examine Fluoroquinolone Resistance in E. coli</i>
<ul>
<li id="CVM_ecoli_2019">Tyson GH, Li C, Hsu CH, Bodeis-Jones S, McDermott PF. Diverse Fluoroquinolone Resistance Plasmids From Retail Meat E. coli in the United States. <b><i>Front Microbiol.</i> 2019</b> Dec 5;10:2826. doi: 10.3389/fmicb.2019.02826. eCollection 2019. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31866986 ">PubMed PMID: 31866986 </a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6906146/">Full text in PubMed Central PMCID: PMC6906146 </a>; <a href="https://doi.org/10.3389/fmicb.2019.02826">Full text at Frontiers in Microbiology</a>.</li>
</ul>
<i>Review of beta lactamases and nomenclature:</i>
<ul>
<li id="BetaLactamases_2018">Bush K. Past and Present Perspectives on &#946;-Lactamases. <b><i>Antimicrob Agents
Chemother</i> 2018</b> Sep 24;62(10). pii: e01076-18. doi: 10.1128/AAC.01076-18. Print 2018 Oct. Review. <a href="https://www.ncbi.nlm.nih.gov/pubmed/30061284">PubMed PMID: 30061284</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6153792/">Full text in PubMed Central PMCID: PMC6153792</a>.</li>
<li id="BetaLactamases_ClassC_2019">Mack AR, Barnes MD, Taracila MA, Hujer AM, Hujer KM, Cabot G, Feldgarden M, Haft DH, Klimke W, van den Akker F, Vila AJ, Smania A, Haider S, Papp-Wallace KM, Bradford PA, Rossolini GM, Docquier JD, Fr&#232;re JM, Galleni M, Hanson ND, Oliver A, Pl&#233;siat P, Poirel L, Nordmann P, Palzkill TG, Jacoby GA, Bush K, Bonomo RA. A standard numbering scheme for class C &#946;-Lactamases. <b><i>Antimicrob Agents
Chemother</i> 2019</b> Nov 11. pii: AAC.01841-19. doi: 10.1128/AAC.01841-19. [Epub ahead of print]. <a href="https://www.ncbi.nlm.nih.gov/pubmed/31712217">PubMed PMID: 31712217</a>; <a href="https://aac.asm.org/content/early/2019/11/05/AAC.01841-19.long">Full text in Antimicrobial Agents and Chemotherapy</a>.</li>
</ul>
<i>Proposal for assignment of allele numbers for mobile colistin resistance (mcr) genes:</i>
<ul>
<li id="MCR_genes_2018">Partridge SR, Di Pilato V, Doi Y, Feldgarden M, Haft DH, Klimke W, Kumar-Singh S, Liu JH, Malhotra-Kumar S, Prasad A, Rossolini GM, Schwarz S, Shen J, Walsh T, Wang Y, Xavier BB. Proposal for assignment of allele numbers for mobile colistin resistance (mcr) genes. <b><i>J Antimicrob Chemother</i> 2018</b> Oct 1;73(10):2625-2630. doi: 10.1093/jac/dky262. <a href="https://www.ncbi.nlm.nih.gov/pubmed/30053115">PubMed PMID: 30053115</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6148208/">Full text in PubMed Central PMCID: PMC6148208</a>.</li>
</ul>
<i>The NCBI AMRFinder tool helps identify the fourth mcr-1 resistant isolate in the US:</i>
<ul>
<li id="mcr-1ResistanceGene_2016">Vasquez AM, Montero N, Laughlin M, Dancy E, Melmed R, Sosa L, Watkins LF, Folster JP, Strockbine N, Moulton-Meissner H, Ansari U, Cartter ML, Walters MS. Investigation of Escherichia coli Harboring the mcr-1 Resistance Gene - Connecticut, 2016. <b><i>MMWR Morb Mortal Wkly Rep.</i> 2016</b> Sep 16;65(36):979-80. doi: 10.15585/mmwr.mm6536e3. <a href="https://www.ncbi.nlm.nih.gov/pubmed/27631346">PubMed PMID: 27631346</a>; <a href="https://www.cdc.gov/mmwr/volumes/65/wr/mm6536e3.htm">Full text at CDC</a>.</li>
</ul>
<i>The NCBI AMRFinder tool helps uncover a novel fosfomycin resistance gene:</i>
<ul>
<li id="FosfomycinResistanceGene_2017">Rehman MA, Yin X, Persaud-Lachhman MG, Diarra MS. First Detection of a Fosfomycin Resistance Gene, fosA7, in Salmonella enterica Serovar Heidelberg Isolated from Broiler Chickens. <b><i>Antimicrob Agents Chemother.</i> 2017</b> Jul 25;61(8). pii: e00410-17. doi: 10.1128/AAC.00410-17. Print 2017 Aug. <a href="https://www.ncbi.nlm.nih.gov/pubmed/28533247">PubMed PMID: 28533247</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5527569/">Full text in PubMed Central PMCID: PMC5527569</a>; <a href="https://aac.asm.org/content/61/8/e00410-17.long">Full text at American Society for Microbiology</a>.</li>
</ul>
<i>The Comprehensive Antibiotic Resistance Database:</i>
<ul>
<li id="CARD_2017">Jia B, Raphenya AR, Alcock B, Waglechner N, Guo P, Tsang KK, Lago BA, Dave BM, Pereira S, Sharma AN, Doshi S, Courtot M, Lo R, Williams LE, Frye JG, Elsayegh T, Sardar D, Westman EL, Pawlowski AC, Johnson TA, Brinkman FS, Wright GD, McArthur AG. CARD 2017: expansion and model-centric curation of the comprehensive antibiotic resistance database. <b><i>Nucleic Acids Res.</i> 2017</b> Jan 4;45(D1):D566-D573. doi: 10.1093/nar/gkw1004. Epub 2016 Oct 26. <a href="https://www.ncbi.nlm.nih.gov/pubmed/27789705">PubMed PMID: 27789705</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5210516/">Full text in PubMed Central PMCID: PMC5210516</a>; <a href="https://academic.oup.com/nar/article/45/D1/D566/2333912">Full text at Oxford Academic</a>.</li>
</ul>
<i>ResFinder:</i>
<ul>
<li id="Resfinder_2012">Zankari E, Hasman H, Cosentino S, Vestergaard M, Rasmussen S, Lund O, Aarestrup FM, Larsen MV. Identification of acquired antimicrobial resistance genes. <b><i>J Antimicrob Chemother.</i> 2012</b> Nov;67(11):2640-4. doi: 10.1093/jac/dks261. Epub 2012 Jul 10. <a href="https://www.ncbi.nlm.nih.gov/pubmed/22782487">PubMed PMID: 22782487</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3468078/">Full text in PubMed Central PMCID: PMC3468078</a>; <a href="https://academic.oup.com/jac/article/67/11/2640/707208">Full text at Oxford Academic</a>.</li>
</ul>
<i>PointFinder:</i>
<ul>
<li id="PointFinder_2017">Zankari E, Alles&#248;e R, Joensen KG, Cavaco LM, Lund O, Aarestrup FM. PointFinder: a novel web tool for WGS-based detection of antimicrobial resistance associated with chromosomal point mutations in bacterial pathogens. <b><i>J Antimicrob Chemother.</i> 2017</b> Oct 1;72(10):2764-2768. doi: 10.1093/jac/dkx217. <a href="https://www.ncbi.nlm.nih.gov/pubmed/29091202">PubMed PMID: 29091202</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5890747/">Full text in PubMed Central PMCID: PMC5890747</a>; <a href="https://academic.oup.com/jac/article/72/10/2764/3979530">Full text at Oxford Academic</a>.</li>
</ul>
</div>
<!-- ======== END_REFERENCES_ANTIMICROBIAL_RESISTANCE ============ -->
<!-- ======== REFERENCES_TEMPLATE_XXXXXXXX ============ -->
<!-- h3 id="______">_____________________ <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" /><a href="#references"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/buttons/toc_icon.png" width="15" height="12" border="0" alt="References, topic list" /></a><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="5" height="1" border="0" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h3 -->
<!-- div style='padding-left: 2em'>
<i>______________</i>
<ul>
<li id="______">Authors II. Article title. <b><i>Journal Name</i> YYYY</b> Mmm; Vol(Issue): PPP-PPP. doi: _____________. <a href="https://www.ncbi.nlm.nih.gov/pubmed/________">PubMed PMID: _______</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/_______/">Full text in PubMed Central PMCID: _______</a>; <a href="__________">Full text at ______</a></li>
</ul>
<i>______________</i>
<ul>
<li id="______">Authors II. Article title. <b><i>Journal Name</i> YYYY</b> Mmm; Vol(Issue): PPP-PPP. doi: _____________. <a href="https://www.ncbi.nlm.nih.gov/pubmed/________">PubMed PMID: _______</a>; <a href="https://www.ncbi.nlm.nih.gov/pmc/articles/_______/">Full text in PubMed Central PMCID: _______</a>; <a href="__________">Full text at ______</a></li>
</ul>
</div -->
<!-- ======== END_REFERENCES_TEMPLATE_XXXXXXXX ============ -->
<!-- ########## END_H2_SECTION:REFERENCES ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ########## H2_SECTION:CONTACT_INFO ########## -->
<h2 id="contact">Contact information <img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" /><a href="#top"><img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/arrowup_blue.gif" width="12" height="12" border="0" alt="back to top" /></a></h2>
<!-- ========== PARAGRAPH =========== -->
<p>If you would like to contact the NCBI Pathogen Detection team, please send an email to: <a href="mailto:pd-help@ncbi.nlm.nih.gov"><b>pd-help@ncbi.nlm.nih.gov</b></a></p>
<!-- ======== END_PARAGRAPH ========= -->
<!-- ########## END_H2_SECTION:CONTACT_INFO ########## -->
<!-- ======== HORIZONTAL_RULE ============ -->
<hr />
<!-- ======== END_HORIZONTAL_RULE ======== -->
<!-- ========== DATE_REVISED =========== -->
<p id="date-revised">Revised 18 Dec 2023
<img src="https://www.ncbi.nlm.nih.gov/Structure/IMG/spacer.gif" width="25" height="1" border="0" alt="" />
Pathogen Detection Project help: <a href="mailto:pd-help@ncbi.nlm.nih.gov" id="mailto_pd">pd-help@ncbi.nlm.nih.gov</a>
</p>
<!-- ======== END_DATE_REVISED ========= -->
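<!-- ============ END_HELP_CONTENT (stray body/html end tags of the embedded help document removed; the page template closes them at the end of the file) ============= -->
</div>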
</section>
</main>
<!-- ========== BEGIN FOOTER ========== -->
<footer>
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg width="40" height="40" viewBox="0 0 40 37" fill="none" xmlns="http://www.w3.org/2000/svg">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008"
d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z"
fill="#5B616B"/>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg
data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11"
d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin"
href="https://www.linkedin.com/company/ncbinlm"
aria-label="LinkedIn"><svg data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11"
d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg
data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11"
d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12"
d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12"
d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12"
d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12"
d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12"
d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12"
d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12"
d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg id="Layer_1" data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 40 40"><defs><style>.cls-1{fill:#737373;}</style></defs><path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"/></svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter"
target="_blank" rel="noopener noreferrer">
<svg width="35" height="35" viewBox="0 0 38 35" fill="none" xmlns="http://www.w3.org/2000/svg">
<title>Twitter</title>
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
<path id="Vector" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.2" stroke-miterlimit="10"></path>
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
</g>
<defs>
<clipPath id="clip0_65276_3946">
<rect width="38" height="38" fill="white"></rect>
</clipPath>
</defs>
</svg></a>
</li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine"
aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px"
y="0px" viewBox="0 0 249 249" style="enable-background:new 0 0 249 249;" xml:space="preserve">
<style type="text/css">
.st10 {
fill: #FFFFFF;
}
.st110 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
</style>
<title>SM-Facebook</title>
<g>
<g>
<path class="st10" d="M159,99.1h-24V88.4c0-5,3.3-6.2,5.7-6.2h16.8V60l-24.4-0.1c-22.1,0-26.2,16.5-26.2,27.1v12.1H90v22.5h16.9
v67.5H135v-67.5h21.7L159,99.1z"></path>
</g>
</g>
<circle class="st110" cx="123.6" cy="123.2" r="108.2"></circle>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="Youtube"
target="_blank" rel="noopener noreferrer"><svg version="1.1" xmlns="http://www.w3.org/2000/svg"
xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px" viewBox="0 0 249 249"
style="enable-background:new 0 0 249 249;" xml:space="preserve">
<title>SM-Youtube</title>
<style type="text/css">
.st4 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
.st5 {
fill: #FFFFFF;
}
</style>
<circle class="st4" cx="124.2" cy="123.4" r="108.2"></circle>
<g transform="translate(0,-952.36218)">
<path class="st5"
d="M88.4,1037.4c-10.4,0-18.7,8.3-18.7,18.7v40.1c0,10.4,8.3,18.7,18.7,18.7h72.1c10.4,0,18.7-8.3,18.7-18.7
v-40.1c0-10.4-8.3-18.7-18.7-18.7H88.4z M115.2,1058.8l29.4,17.4l-29.4,17.4V1058.8z"></path>
</g>
</svg></a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br>
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323"
class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br>
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br>
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office"
class="text-white">FOIA</a><br>
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br>
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br>
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<!-- Bottom footer navigation: links to NLM, NIH, HHS and USA.gov. All targets use explicit https:// URLs. -->
<nav class="bottom-links">
  <ul class="mt-3">
    <li>
      <a class="text-white" href="https://www.nlm.nih.gov/">NLM</a>
    </li>
    <li>
      <a class="text-white" href="https://www.nih.gov/">NIH</a>
    </li>
    <li>
      <a class="text-white" href="https://www.hhs.gov/">HHS</a>
    </li>
    <li>
      <a class="text-white" href="https://www.usa.gov/">USA.gov</a>
    </li>
  </ul>
</nav>
</div>
</div>
</div>
</section>
</footer>
<!-- ========== END FOOTER ========== -->
<!-- javascript to inject NWDS meta tags. Note: value of nwds_version is updated by "npm version" command -->
<script type="text/javascript">
var nwds_version = "1.2.3";
var meta_nwds_ver = document.createElement('meta');
meta_nwds_ver.name = 'ncbi_nwds_ver';
meta_nwds_ver.content = nwds_version;
document.getElementsByTagName('head')[0].appendChild(meta_nwds_ver);
var meta_nwds = document.createElement('meta');
meta_nwds.name = 'ncbi_nwds';
meta_nwds.content = 'yes';
document.getElementsByTagName('head')[0].appendChild(meta_nwds);
var alertsUrl = "/core/alerts/alerts.js";
if (typeof ncbiBaseUrl !== 'undefined') {
alertsUrl = ncbiBaseUrl + alertsUrl;
}
</script>
<!-- JavaScript -->
<script src="/pathogens/static/django_uswds/uswds/js/uswds.js"></script>
<script src="https://code.jquery.com/jquery-3.5.0.min.js"
integrity="sha256-xNzN2a4ltkB44Mc/Jz3pT4iU1cmeR0FkXs4pru/JxaQ="
crossorigin="anonymous">
</script>
<script>
var fallbackJquery = "/pathogens/static/base/js/jquery-3.5.0.min.js";
window.jQuery || document.write("<script src=" + fallbackJquery + ">\x3C/script>")
</script>
<script src="/pathogens/static/nwds/js/nwds.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/header.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbipopup.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbiclearbutton.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/override-uswds.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbifeedback.js" type="text/javascript"> </script>
<script type="text/javascript" src="https://www.ncbi.nlm.nih.gov/core/pinger/pinger.js"> </script>
<script type="text/javascript" src="/pathogens/static/main/scripts/page-search.js" charset="utf-8"></script>
</body>
</html>