nih-gov/www.ncbi.nlm.nih.gov/pathogens/faq/index.html

729 lines
No EOL
41 KiB
HTML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<!DOCTYPE html>
<html lang="en" >
<head >
<meta charset="UTF-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<!-- Mobile properties -->
<meta name="HandheldFriendly" content="True">
<meta name="MobileOptimized" content="320">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<!-- Stylesheets -->
<link href="/pathogens/static/django_uswds/uswds/css/uswds.css" rel="stylesheet" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/nwds.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/header.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/footer.css" />
<link rel="stylesheet" href="/pathogens/static/nwds/css/form.css" />
<link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.7.0/css/font-awesome.min.css"/>
<title>
NCBI Pathogen Detection Frequently Asked Questions (FAQ) -
Pathogen Detection - NCBI
</title>
<!-- extra head -->
<!-- Favicons -->
<link rel="shortcut icon" type="image/ico" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon.ico" />
<link rel="icon" type="image/png" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon.png" />
<!-- 192x192, as recommended for Android
http://updates.html5rocks.com/2014/11/Support-for-theme-color-in-Chrome-39-for-Android
-->
<link rel="icon" type="image/png" sizes="192x192" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-192.png" />
<!-- 57x57 (precomposed) for iPhone 3GS, pre-2011 iPod Touch and older Android devices -->
<link rel="apple-touch-icon-precomposed" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-57.png">
<!-- 72x72 (precomposed) for 1st generation iPad, iPad 2 and iPad mini -->
<link rel="apple-touch-icon-precomposed" sizes="72x72" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-72.png">
<!-- 114x114 (precomposed) for iPhone 4, 4S, 5 and post-2011 iPod Touch -->
<link rel="apple-touch-icon-precomposed" sizes="114x114" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-114.png">
<!-- 144x144 (precomposed) for iPad 3rd and 4th generation -->
<link rel="apple-touch-icon-precomposed" sizes="144x144" href="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/favicons/favicon-144.png">
<link rel="stylesheet" href="/pathogens/static/main/styles/app.css" type="text/css" media="screen">
<link rel="stylesheet" href="/pathogens/static/main/styles/breadcrumbs.css" type="text/css" media="screen">
<style type="text/css">
a { text-decoration: underline }
</style>
<!-- Logging params: Pinger defaults -->
<meta name="ncbi_app" content="labs_pathogens" />
<meta name="ncbi_pdid" content="static" />
<meta name="ncbi_phid" content="939B8FCEB20BE4F500004A37E2251606.1.m_8" />
<!-- /extra head -->
<link rel="stylesheet" href="/pathogens/static/main/styles/page-search.css" type="text/css">
</head>
<body >
<a class="usa-skipnav" href="#main_content">Skip to main page content</a>
<!-- ========== BEGIN HEADER ========== -->
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button
class="usa-accordion-button usa-banner-button"
aria-expanded="false"
aria-controls="gov-banner-top"
>
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div
class="usa-banner-content usa-grid usa-accordion-content"
id="gov-banner-top"
>
<div class="usa-banner-guidance-gov usa-width-one-half">
<img
class="usa-banner-icon usa-media_block-img"
src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg"
alt="Dot gov"
/>
<div class="usa-media_block-body">
<p>
<strong>The .gov means its official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure youre on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img
class="usa-banner-icon usa-media_block-img"
src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg"
alt="Https"
/>
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="https://www.ncbi.nlm.nih.gov/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none"
aria-controls="account_popup">
<span class="fa fa-user" aria-hidden="true"></span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu"><span class="fa fa-times"></span><span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br/>
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
<!-- ========== END HEADER ========== -->
<main id="main_content" accesskey="3">
<section class="pathogens-content-page usa-grid">
<div class="usa-width-one-whole ptg-top">
<div><ul id="breadcrumbs" class="usa-unstyled-list breadcrumbs">
<li><a href="https://www.ncbi.nlm.nih.gov/home/health.shtml">Health</a></li>
<li><a href=/pathogens/>Pathogen Detection</a></li>
<li>NCBI Pathogen Detection Frequently Asked Questions (FAQ)</li>
</ul>
</div>
<div class="ptg-search">
<input placeholder="Search page" type="search"/><button title="Previous" disabled="disabled"></button><button title="Next" disabled="disabled"></button>
</div>
</div>
<div>
<h1 id="pathgen-faq-main">NCBI Pathogen Detection Frequently Asked Questions (FAQ)</h1>
<h2 aria-expanded="true" id="where-can-i-find-more-informatio">Where can I find more information on the NCBI Pathogen Detection System</h2>
<p>Our <a href="/pathogens/pathogens_help/">help page</a> provides detailed documentation on how to use the NCBI Pathogen Detection System, including all of the ways to view the processed data in our browsers. Additional information on the organization of the FTP site and on analysis methods can be found on our FTP site in the <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">ReadMe.txt</a> and <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Methods.txt">Methods.txt</a> files.</p>
<h2 aria-expanded="false" id="what-is-the-pathogen-detection-p">What is the Pathogen Detection project?</h2>
<p><a href="/pathogens/">NCBI Pathogen Detection</a> project is a centralized system that
integrates sequence data and analysis for bacterial pathogens.</p>
<p>NCBI Pathogen Detection integrates bacterial and fungal pathogen genomic
sequences from numerous ongoing surveillance and research efforts whose sources
include food, environmental sources such as water or production facilities, and
patient samples. Foodborne, hospital-acquired, and other potentially clinically
infectious pathogens are included.</p>
<p>The system provides two major automated real-time analyses:</p>
<ol>
<li>It quickly clusters related pathogen genome sequences to identify potential
transmission chains, helping public health scientists investigate disease
outbreaks</li>
<li>As part of the National Database of Antibiotic Resistant Organisms (NDARO),
NCBI screens genomic sequences using AMRFinderPlus to identify the
antimicrobial resistance, stress response, and virulence genes found in
bacterial genomic sequences, which enables scientists to track the spread of
resistance genes and to understand the relationships among antimicrobial
resistance, stress response, and virulence.</li>
</ol>
<p>A number of public health agencies and researchers in the US and
internationally are collecting samples from clinical cases, from the
environment, from food products, and from industrial production facilities to
facilitate active, real-time surveillance of pathogens, including foodborne
disease. Public health agencies and researchers sequence the samples and submit
the data to NCBI, which analyzes the sequences and compares them to others in
its database, including all genomes in GenBank, to identify closely related
sequences. The aim is to identify closely or clonally related isolates to aid
in outbreak investigation. </p>
<p>The NCBI Pathogen Detection Project also analyzes the assemblies in its database in real-time for known anti-microbial resistance (AMR) genes and other genes of interest and maintains <a href="/pathogens/antimicrobial-resistance/">software and databases</a> to facilitate monitoring and research including the <a href="/pathogens/antimicrobial-resistance/">National Database of Antibiotic Resistant Organisms</a>.</p>
<h2 aria-expanded="false" id="what-is-a-targetisolate">What is a target/isolate?</h2>
<p>A target is an assembled genome for one pathogen isolate. Assemblies for this may not yet be available in GenBank.</p>
<h2 aria-expanded="false" id="what-are-these-accession-numbers">What are these Accession Numbers? What is a PDG?</h2>
<p>The Pathogen Detection system is currently using three series of Accession
Numbers. </p>
<ul>
<li>PDT# - isolate accession for each pathogen genome</li>
<li>PDG# - taxgroup accessions for each organism group</li>
<li>PDS# - SNP cluster accessions - are sets of isolates that have been determined by wgMLST or single-linkage clustering to be closely related for the purposes of facilitating outbreak and traceback investigations. Note - not all isolates within the taxgroups will be genetically similar enough to another isolate to fall into a SNP cluster. In other words there will be isolates in the taxgroup (PDG#) that will not have a PDS number assigned because they were not found sufficiently close to other isolates in our system to be clustered together.</li>
</ul>
<p>These Accession Numbers are distinct from those associated with nucleotide records in GenBank or RefSeq. These Accession Numbers are available in the <a href="/pathogens/isolates">Pathogen Detection Isolates Browser</a>, <a href="/pathogens/microbigge">MicroBIGG-E</a>, and in <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP</a> files.</p>
<p>Each of the accessions ends in a .version e.g., PDG000000004.355. A larger
version number is always more recent than a smaller version number.</p>
<p>Note that unlike many other NCBI resources the Pathogen Detection accessions
are not archival (the data they refer to is not guaranteed to persist
indefinitely) because of the rapid real-time reanalysis that happens in the
Pathogen Detection System. For that reason we recommend you download the
metadata associated with your analyses and save it locally. Check our <a href="/core/assets/pathogens/files/HowTo/how_to_cite_pathogen_detection.pdf">HowTo
Cite the Pathogen Detection Resource and the Data Contained
Within</a>
PDF for info on how to get the metadata for web-based analyses.</p>
<h2 aria-expanded="false" id="does-the-pathogen-detection-syst">Does the Pathogen Detection system use all genomes?</h2>
<p>For each organism group the system incorporates ALL assembled genomes submitted
to GenBank that are not flagged as anomalous in the <a href="/assembly">Assembly database</a>, and select sequences submitted to <a href="/sra">SRA</a> by public health agencies and
others. If you would like sequences you have submitted to SRA from the <a href="/pathogens/organisms/">supported organisms</a> to be included in the NCBI Pathogen Detection analysis please contact us at <a href="mailto:pd-help@ncbi.nlm.nih.gov">pd-help@ncbi.nlm.nih.gov</a>.</p>
<h2 aria-expanded="false" id="what-about-other-types-of-bacter">What about other types of bacterial pathogens?</h2>
<p>NCBI Pathogen Detection now analyzes over <a href="/pathogens/organisms/">50 taxa</a>, and
more are addded as capacity allows. If you are interested in large-scale
real-time analyses of pathogens that are not included in the <a href="/pathogens/organisms/">Organism
Groups we analyze</a>, please contact us at
<a href="mailto:pd-help@ncbi.nlm.nih.gov">pd-help@ncbi.nlm.nih.gov</a>.</p>
<h2 aria-expanded="false" id="where-are-the-analysis-results-h">Where are the analysis results? How can I visualize the results?</h2>
<p>Results can be viewed in the <a href="/pathogens/isolates">Isolates Browser</a>,
<a href="/pathogens/microbigge">MicroBIGG-E</a>, and by
<a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results">FTP</a> approximately every
day if new data are submitted. Our system outputs SNP cluster trees in
*.pdf, *.newick, and *.asn format. The *.asn format can be opened
in <a href="/tools/gbench/">NCBI's Genome Workbench tool</a>. The phylogenetic
trees for the SNP clusters are available on both
<a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP</a> and in the
<a href="/pathogens/isolates">isolates browser</a>.
<a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a> results
are available in the Microbial Browser for the Identification of Genetic and Genomic Elements (<a href="/pathogens/microbigge">MicroBIGG-E</a>).</p>
<p>More information can be found in our <a href="/pathogens/pathogens_help/">help documentation</a> and <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/ReadMe.txt">FTP ReadMe file</a>.</p>
<h2 aria-expanded="false" id="how-are-isolates-clustered-and-w">How are isolates clustered and what are SNP clusters?</h2>
<!--
All isolates for a given taxonomic group are compared to each other, either by
a shared K-mer approach for smaller groups or by wgMLST for those groups with
sufficient numbers of assemblies to develop a good wgMLST scheme.
For taxonomic groups with wgMLST schemes all isolates that have fewer than 25
different alleles at shared loci are grouped into a "SNP cluster" for SNP-based
analysis and phylogenetic tree inference.
Taxonomic groups that are grouped by shared Kmers are clustered first into
larger clusters by Kmer analysis then within each of those "Kmer clusters" all
assemblies are aligned to each-other and those assemblies within 50 filtered
SNPs of each-other are grouped into a "SNP cluster" for SNP-based phylogenetic
tree inference.
-->
<p>See the <a href="/pathogens/pathogens_help/#data-processing-overview">Pipeline overview</a>
on our help page for a high level description of the pipeline including clustering, and the
<a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Methods.txt">Methods.txt</a> on our FTP
site for more details.</p>
<h2 aria-expanded="false" id="how-are-snp-distances-computed">How are SNP distances computed?</h2>
<p>SNP distances are patristic distances on the maximum compatibility tree. See
below and the (<a href="/pubmed/28231758">Cherry, J. 2017. A practical exact maximum compatibility
algorithm for reconstruction of recent evolutionary history. BMC Bioinformatics:
2017 Feb 23;18(1):127. doi: 10.1186/s12859-017-1520-4</a>)
for more information on SNP distance calculation. For a description of
filtering of potential SNP sites that occurs before running compat see the
<a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Methods.txt">Methods.txt</a>
file on FTP.</p>
<h2 aria-expanded="false" id="i-know-there-are-some-snps-separ">I know there are some SNPs separating these two isolates but in your cluster you are showing them 0 SNPs apart, why?</h2>
<p>We have several filtering steps that may be filtering out the SNPs that you see. In order to handle varying quality and error levels of sequence and assembly SNP filtering is required. See our <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Methods.txt">Methods.txt</a> file for information on SNP filtering. Individual SNPs and filtering is indicated in the VCF file provided for each of the SNP clusters.</p>
<h2 aria-expanded="false" id="why-doesnt-your-cluster-correspo">Why doesn't your cluster correspond to this published cluster? What are you doing different?</h2>
<p>Our clusters are based solely on automated analysis of isolate sequences. Published outbreaks generally consider other, epidemiological factors, as they should. </p>
<h2 aria-expanded="false" id="can-i-add-my-own-isolates-to-the">Can I add my own isolates to the cluster and recompute it?</h2>
<p>If you submit your sequence and let us know it will be included in the full
analysis pipeline. See our <a href="/pathogens/submit-data/">How to submit</a> page for
more information on how to submit your data.</p>
<p>However, the Pathogen Detection system is a high-throughput, automated system
and we are unable to customize SNP cluster contents, so if the pipeline does
not identify your isolate as being sufficiently close to others in a cluster it
will not be included in a cluster.</p>
<h2 aria-expanded="false" id="i-know-these-isolates-are-near-t">I know these isolates are near to the outbreak isolates, but they don't appear in the cluster</h2>
<p>See the above answer about how isolates are clustered. There are some possible data issues that may cause isolates that are in fact closely related to appear too distantly related. While we have extensive filtering steps to minimize the chances of this happen it can sometimes occur when the sequence data is contaminated or poor-quality.</p>
<h2 aria-expanded="false" id="i-know-these-isolates-are-more-t">I know these isolates are more than 50 SNPs away from the outbreak isolates, but is there any way I can get these included in the cluster to see exactly what the SNP distance is?</h2>
<p>No. The Pathogen Detection system is a high-throughput, automated system and we are unable to customize SNP cluster contents.</p>
<h2 aria-expanded="false" id="what-is-the-snp-threshold-for-an">What is the SNP threshold for an outbreak?</h2>
<p>The number of SNPs that define an oubreak is variable and depends on many factors. Outbreak determinations should be made in concert with epidemiological factors, and the number and identity of SNPs that identify an outbreak are dependent on these factors.</p>
<h2 aria-expanded="false" id="how-do-i-know-when-new-analysis-">How do I know when new analysis results are released?</h2>
<p>The pipeline produces new analysis results every day if new data has arrived for each organism group. The <a href="/pathogens/">Pathogen Detect home page</a> shows the most recent results with Accession Numbers, count of newly added and total isolates, and a link to each taxonomic group subset in the Isolates Browser.</p>
<p>The <a href="https://ftp.ncbi.nlm.nih.gov/pathogen/Results/">FTP</a> directory contains links to the latest kmer analysis and SNP analysis for each organism.</p>
<p>Automatic emails can notify you in real-time when there are updates for any Isolates Browser search. For more information see our Isolates Browser help for <a href="/pathogens/pathogens_help/#automated-searches">Automatic E-mail Notifications of New Data</a>.</p>
<h2 aria-expanded="false" id="how-do-i-submit-data">How do I submit data?</h2>
<p>Information on how to submit can be found <a href="/pathogens/submit-data/">here</a>.</p>
<h2 aria-expanded="false" id="how-do-i-submit-betalactamase-mc">How do I submit beta-lactamase, MCR, or Qnr alleles?</h2>
<p>Information on how to submit for allele assignment can be found <a href="/pathogens/submit-beta-lactamase/">here</a></p>
<h2 aria-expanded="false" id="how-do-i-submit-and-find-ast-dat">How do I submit and find AST data?</h2>
<p>To <a href="/pathogens/submit-data/#ast">submit AST data</a>.</p>
<p>To <a href="/pathogens/isolates/#AST_phenotypes:*">find all isolates with BioSample records in the isolates browser</a>.</p>
<p>To <a href="/biosample/?term=antibiogram%5bfilter%5d">find all BioSample records that have AST data</a>.</p>
<h2 aria-expanded="false" id="how-do-i-contact-the-pathogen-de">How do I contact the Pathogen Detection team?</h2>
<p>The Pathogen Detection team can be reached by email at <a href="mailto:pd-help@ncbi.nlm.nih.gov">pd-help@ncbi.nlm.nih.gov</a>.</p>
<h2 aria-expanded="false" id="what-are-the-amr_genotypes-and-a">What are the AMR_genotypes and AST_phenotypes column?</h2>
<p>These two columns refer to antimicrobial resistance.</p>
<p>The AST_phenotypes column corresponds to the antibiogram submission into BioSample database that captures antibiotic susceptbility phenotypic testing (MICs or disk diffusion). Only isolates that have an antibiogram submitted will show AST data. See the help document for the <a href="/pathogens/pathogens_help/#isolates-browser-data-field-ASTPhenotypes">AST phenotypes column</a>.</p>
<p>The AMR_genotypes column corresponds to antimicrobial resistance genes that
have been identified by NCBI's
<a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. This process
is run on all isolates submitted by collaborators contributing data for the
Pathogen Detection system, and is also run against all
GenBank genomes that are incorporated into the <a href="/pathogens/isolates">Isolates
Browser</a> (although there may
be a delay in the analysis). See also the help document on the <a href="/pathogens/pathogens_help/#isolates-browser-data-field-AMRGenotypes">AMR genotypes
column</a>.
For more info about NCBI's efforts about antimicrobial resistance gene/protein
identification, see <a href="/pathogens/antimicrobial-resistance/">Antimicrobial
Resistance</a>.
For information on the software we developed to identify AMR genes see
<a href="/pathogens/antimicrobial-resistance/AMRFinder/">AMRFinderPlus</a>. For
information on the reference set of genes and proteins see the <a href="/pathogens/refgene/">Reference Gene
Catalog</a>.</p>
<h2 aria-expanded="false" id="how-are-the-phylogenetic-trees-r">How are the phylogenetic trees reconstructed?</h2>
<p>The SNP trees are calculated using a maximum compatibility algorithm that is efficient for closely related bacteria while dealing with input data quality issues. The algorithm is described in this paper (<a href="/pubmed/28231758">Cherry, J. 2017. A practical exact maximum compatibility algorithm for reconstruction of recent evolutionary history. BMC Bioinformatics: 2017 Feb 23;18(1):127. doi: 10.1186/s12859-017-1520-4</a>). The VCF file output has a field that lists incompatible sites that were filtered by compat.</p>
<h2 aria-expanded="false" id="software_list">Can I download the software and run it myself?</h2>
<p>Unfortunately the complete current pipeline is tied very tightly to many NCBI internal resources and so it can't be run outside of our environment. We would like to make a distributable version, but we have not yet had development capacity to do so. Several pieces of software devloped by NCBI and used in the pipeline are available including:</p>
<ul>
<li>AMR, stress resistance, and virulence gene identification software AMRFinderPlus <a href="https://pubmed.ncbi.nlm.nih.gov/31427293/">Paper</a> and <a href="https://github.com/ncbi/amr/wiki">Software</a></li>
<li>The assemblers SKESA and SAUTE <a href="https://pubmed.ncbi.nlm.nih.gov/30286803/">Paper</a> and <a href="https://github.com/ncbi/skesa">Software</a></li>
<li>The maximum compatibility phylogenetic inference software "compat" <a href="https://pubmed.ncbi.nlm.nih.gov/28231758/">Paper</a> and <a href="https://ftp.ncbi.nih.gov/pub/jcherry/compat/">Software</a></li>
<li>The PGAP annotation system <a href="https://pubmed.ncbi.nlm.nih.gov/29112715/">Paper</a> and <a href="https://github.com/ncbi/pgap">Software</a></li>
</ul>
<h2 aria-expanded="false" id="is-your-snp-pipeline-published">Is your SNP pipeline published?</h2>
<p>Not yet. We're working on it :-)</p>
<p>In the meantime several of the components NCBI developed for the pipeline are published and open source <a href="#software_list">See above</a> and <a href="/pathogens/pathogens_help/#references">pipeline references</a>).</p>
<p><span id="shared-content-1"/></p>
</div>
</section>
</main>
<!-- ========== BEGIN FOOTER ========== -->
<footer>
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg width="40" height="40" viewBox="0 0 40 37" fill="none" xmlns="http://www.w3.org/2000/svg">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008"
d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z"
fill="#5B616B"/>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg
data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11"
d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin"
href="https://www.linkedin.com/company/ncbinlm"
aria-label="LinkedIn"><svg data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11"
d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg
data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300">
<defs>
<style>
.cls-11,
.cls-12 {
fill: #737373;
}
.cls-11 {
fill-rule: evenodd;
}
</style>
</defs>
<title>GitHub</title>
<path class="cls-11"
d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
</path>
<path class="cls-12"
d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
</path>
<path class="cls-12"
d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
</path>
<path class="cls-12"
d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
<path class="cls-12"
d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
</path>
<path class="cls-12"
d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
</path>
<path class="cls-12"
d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
</path>
<path class="cls-12"
d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
</svg></a>
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
<svg id="Layer_1" data-name="Layer 1" xmlns="http://www.w3.org/2000/svg" viewBox="0 0 40 40"><defs><style>.cls-1{fill:#737373;}</style></defs><path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"/></svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter"
target="_blank" rel="noopener noreferrer">
<svg width="35" height="35" viewBox="0 0 38 35" fill="none" xmlns="http://www.w3.org/2000/svg">
<title>Twitter</title>
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
<path id="Vector" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.2" stroke-miterlimit="10"></path>
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
</g>
<defs>
<clipPath id="clip0_65276_3946">
<rect width="38" height="38" fill="white"></rect>
</clipPath>
</defs>
</svg></a>
</li>
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine"
aria-label="Facebook" rel="noopener noreferrer" target="_blank">
<svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px"
y="0px" viewBox="0 0 249 249" style="enable-background:new 0 0 249 249;" xml:space="preserve">
<style type="text/css">
.st10 {
fill: #FFFFFF;
}
.st110 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
</style>
<title>SM-Facebook</title>
<g>
<g>
<path class="st10" d="M159,99.1h-24V88.4c0-5,3.3-6.2,5.7-6.2h16.8V60l-24.4-0.1c-22.1,0-26.2,16.5-26.2,27.1v12.1H90v22.5h16.9
v67.5H135v-67.5h21.7L159,99.1z"></path>
</g>
</g>
<circle class="st110" cx="123.6" cy="123.2" r="108.2"></circle>
</svg>
</a></li>
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="Youtube"
target="_blank" rel="noopener noreferrer"><svg version="1.1" xmlns="http://www.w3.org/2000/svg"
xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px" viewBox="0 0 249 249"
style="enable-background:new 0 0 249 249;" xml:space="preserve">
<title>SM-Youtube</title>
<style type="text/css">
.st4 {
fill: none;
stroke: #FFFFFF;
stroke-width: 8;
stroke-miterlimit: 10;
}
.st5 {
fill: #FFFFFF;
}
</style>
<circle class="st4" cx="124.2" cy="123.4" r="108.2"></circle>
<g transform="translate(0,-952.36218)">
<path class="st5"
d="M88.4,1037.4c-10.4,0-18.7,8.3-18.7,18.7v40.1c0,10.4,8.3,18.7,18.7,18.7h72.1c10.4,0,18.7-8.3,18.7-18.7
v-40.1c0-10.4-8.3-18.7-18.7-18.7H88.4z M115.2,1058.8l29.4,17.4l-29.4,17.4V1058.8z"></path>
</g>
</svg></a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
<p class="address_footer text-white">National Library of Medicine<br>
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323"
class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br>
Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br>
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office"
class="text-white">FOIA</a><br>
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br>
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br>
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<nav class="bottom-links">
<ul class="mt-3">
<li>
<a class="text-white" href="//www.nlm.nih.gov/">NLM</a>
</li>
<li>
<a class="text-white"
href="https://www.nih.gov/">NIH</a>
</li>
<li>
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
</li>
<li>
<a
class="text-white" href="https://www.usa.gov/">USA.gov</a>
</li>
</ul>
</nav>
</div>
</div>
</div>
</section>
</footer>
<!-- ========== END FOOTER ========== -->
<!-- javascript to inject NWDS meta tags. Note: value of nwds_version is updated by "npm version" command -->
<script type="text/javascript">
var nwds_version = "1.2.3";
var meta_nwds_ver = document.createElement('meta');
meta_nwds_ver.name = 'ncbi_nwds_ver';
meta_nwds_ver.content = nwds_version;
document.getElementsByTagName('head')[0].appendChild(meta_nwds_ver);
var meta_nwds = document.createElement('meta');
meta_nwds.name = 'ncbi_nwds';
meta_nwds.content = 'yes';
document.getElementsByTagName('head')[0].appendChild(meta_nwds);
var alertsUrl = "/core/alerts/alerts.js";
if (typeof ncbiBaseUrl !== 'undefined') {
alertsUrl = ncbiBaseUrl + alertsUrl;
}
</script>
<!-- JavaScript -->
<script src="/pathogens/static/django_uswds/uswds/js/uswds.js"></script>
<script src="https://code.jquery.com/jquery-3.5.0.min.js"
integrity="sha256-xNzN2a4ltkB44Mc/Jz3pT4iU1cmeR0FkXs4pru/JxaQ="
crossorigin="anonymous">
</script>
<script>
var fallbackJquery = "/pathogens/static/base/js/jquery-3.5.0.min.js";
window.jQuery || document.write("<script src=" + fallbackJquery + ">\x3C/script>")
</script>
<script src="/pathogens/static/nwds/js/nwds.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/header.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbipopup.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbiclearbutton.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/override-uswds.js" type="text/javascript"> </script>
<script src="/pathogens/static/nwds/js/ncbifeedback.js" type="text/javascript"> </script>
<script type="text/javascript" src="https://www.ncbi.nlm.nih.gov/core/pinger/pinger.js"> </script>
<script type="text/javascript" src="/pathogens/static/main/scripts/page-search.js" charset="utf-8"></script>
</body>
</html>