nih-gov/www.ncbi.nlm.nih.gov/Structure/protfam/about.html

312 lines
22 KiB
HTML

<!DOCTYPE html>
<html>
<head>
<meta http-equiv="Content-Type" content="text/html;charset=UTF-8">
<meta name="ncbi_app" content="cdd" /><meta name="ncbi_pdid" content="SARS-CoV-2 models" /><meta name="ncbi_db" content="cdd" />
<meta name="description" content="Conserved Domain Database (CDD) models and 3D protein structures relevant to SARS-CoV-2, the novel coronavirus that causes the COVID-19 pandemic. This is a resource of the National Center of Biotechnology Information (NCBI), National Library of Medicine (NLM)">
<meta name="keywords" content="proteins, functional, conserved domains, 3D structures, macromolecular structures, severe acute respiratory syndrome coronavirus 2, architecture, coronavirus, pandemic, SARS-CoV-2, COVID-19">
<title>What are Protein Family Models?</title>
<meta name="viewport" content="width=device-width, initial-scale=1">
<link rel="apple-touch-icon" href="apple-touch-icon.png">
<link rel="icon shortcut" type="image/x-icon" href="favicon.ico">
<link rel="stylesheet" type="text/css" href="https://www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/uswds/resources/uswds-not-greedy.min.css">
<link rel="stylesheet" type="text/css" href="https://www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/uswds/resources/header.min.css">
<link rel="stylesheet" type="text/css" href="https://www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/uswds/resources/footer.min.css">
<link rel="stylesheet" type="text/css" href="https://www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/uswds/resources/form.min.css">
<link rel="stylesheet" type="text/css" href="resources/sheet.css" >
<style type="text/css">.ncbi-alerts { background: none repeat scroll 0% 0% #671414;color: #fff;padding: .231em 1.231em;}.ncbi-alerts p { color: #fff; }.ncbi-alerts a, .ncbi-alerts a:visited {color: #fff; background: none;}.ncbi-alerts p {margin: 1em 0;padding: 0 0 0 1.5em; }.ncbi-alerts p:nth-child(1) {background-image: url('/core/icons/information.png');background-position: left top;background-repeat: no-repeat }.ncbi-alerts.subclosed p:nth-child(1) {background-image: url('/core/alerts/warning.png');}.ncbi-alerts.subclosed p { padding-left: 2em;}.ncbi-alerts.pubmed, .ncbi-alerts.pubmed p {background-color: #97B0C8; color: #000;}.ncbi-alerts a { text-decoration: underline !important; }.ncbi-alerts.pubmed a, .ncbi-alerts.pubmed a:visited { color: #000; }.ncbi-alerts, .ncbi-alerts p {background-color: #97B0C8; color: #000;}.ncbi-alerts a, .ncbi-alerts a:visited { color: #000; }</style>
<style>
html {font-size: 10px;}
.waffle {font-size:0.9em }
.waffle a {
color: #0071bc!important;
text-decoration: none;
}
.waffle a:hover,
.waffle a:active {
color: #205493!important;
text-decoration: underline;
}
.waffle a:visited {
color: #4c2c92!important;
}
.readmore {display:inline-block; cursor:pointer; color: #0071bc; text-decoration: underline; font-style: italic;}
</style>
<!-- end content styles -->
</head>
<body>
<!--[if lte IE 8]>
<p class="browsehappy">You are using an <strong>outdated</strong> browser. Please <a href="http://browsehappy.com/">upgrade
your browser</a> to improve your experience.</p>
<![endif]-->
<!--indicator of global warning insertion-->
<div id="global_alert" style="display:none"></div>
<!-- Manually inserted NCBI message, as this is just an html and did not go through web services of any kind
<div class="ncbi-alerts nCoV" style="display: block; margin-bottom: 0px;"><p></p><p style="padding: 0.5em 2em; font-size: 12px; text-align: center; background: #FFB6B6 url(/core/icons/exclamation.png) no-repeat 5px center;">COVID-19 is an emerging, rapidly evolving situation.<br>Get the latest public health information from CDC: <a href="https://www.coronavirus.gov">https://www.coronavirus.gov </a>.<br>Get the latest research from NIH: <a href="https://www.nih.gov/coronavirus">https://www.nih.gov/coronavirus</a>.</p><p></p></div>
-->
<div class="us">
<a class="skipnav" href="#maincontent">Skip to main page content</a>
<header class="ncbi-page-header" role="banner">
<div class="prefix">
<span class="nih" title="National Institutes of Health">
<a href="https://www.nih.gov/" title="To NIH homepage">
<img src="nih-logo-header.svg" width="82%" height="82%" alt="NIH">
</a>
</span>
<span class="nlm">
<a href="https://www.nlm.nih.gov/" title="To NLM homepage">U.S. National Library of Medicine</a>
</span>
</div>
<div class="ncbi">
<abbr class="abbr">
<a href="https://www.ncbi.nlm.nih.gov/" title="To NCBI homepage">NCBI</a>
</abbr>
<span class="name">
<a href="https://www.ncbi.nlm.nih.gov/" accesskey="1" title="To NCBI homepage">National Center for Biotechnology Information</a>
<a href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0">Accesskeys</a>
</div>
</header>
</div>
<!--
<div class="ncbi-alerts nCoV" style="display: block; margin-bottom: 16.003px;"><p></p><p style="padding: 0.5em 2em; font-size: 12px; text-align: center; background: #FFB6B6 url(/core/icons/exclamation.png) no-repeat 5px center;">COVID-19 is an emerging, rapidly evolving situation.<br>Get the latest public health information from CDC: <a href="https://www.coronavirus.gov">https://www.coronavirus.gov </a>.<br>Get the latest research from NIH: <a href="https://www.nih.gov/coronavirus">https://www.nih.gov/coronavirus</a>.<br>Find NCBI SARS-CoV-2 literature, sequence, and clinical content: <a href="https://www.ncbi.nlm.nih.gov/sars-cov-2/">https://www.ncbi.nlm.nih.gov/sars-cov-2/</a>.</p><p></p></div>
-->
<!-- Start of Real content-->
<!-- Insert static message blocks here
<div class="ncbi-alerts null" style="display: block; margin-bottom: 0px;"><p></p><p style="padding: 0.5em 2em; font-size: 12pt; text-align: center; background: #FFB6B6 url(/core/icons/exclamation.png) no-repeat 5px center;">Because of a lapse in government funding, the information on this website may not be up to date, transactions submitted via the website may not be processed, and the agency may not be able to respond to inquiries until appropriations are enacted.<br>The NIH Clinical Center (the research hospital of NIH) is open. For more details about its operating status, please visit <a href="http://cc.nih.gov">cc.nih.gov</a>.<br>Updates regarding government operating status and resumption of normal operations can be found at <a href="http://USA.gov">USA.gov</a>.</p></div>
<!-- End of message block---------------->
<div id="sl-page-content-wrap" class="us">
<div class="usa-grid-full">
<html lang="en"><head>
<br><title>What are Protein Family Models</title>
<style>
body {font-family: Verdana, Arial, Helvetica, sans-serif; font-size:0.9em;}
table { border-collapse: collapse;}
table tr td { border-bottom: 1px solid #ddd;}
.largetitle {font-size:1.3em; font-weight:bold}
.title {font-size:1.1em; font-weight:bold}
</style>
</head>
<body>
<div class='largetitle'>What are Protein Family Models?</div><br>
<div>
The <a href="https://www.ncbi.nlm.nih.gov/protfam">Protein Family Models database</a> contains Hidden Markov models (HMM), <a href="https://www.ncbi.nlm.nih.gov/Structure/cdd/cdd.shtml">conserved domain (CDD) architectures</a> and <a href="https://www.ncbi.nlm.nih.gov/pubmed/29112715">BlastRules</a> that represent protein families found in prokaryotes and eukaryotes. Notably, this database includes the models used for structural and functional annotation by the NCBI <a href="https://www.ncbi.nlm.nih.gov/genome/annotation_prok/">(Prokaryotic Genome Annotation Pipeline (PGAP))</a>.
</div>
<br>
<div class='title'>HMMs</div><br>
<div>
An HMM-based protein family is a probabilistic model used to determine which proteins belong or don't belong to the family. HMMs are built by converting multiple sequence alignments (seed alignments) of proteins of known function into a position-specific scoring system to generate an HMM profile. Amino acids at each position on the seed alignment are given a score according to their frequency. Sequence and domain cutoffs are established based on the seed alignments and used as minimum thresholds for query proteins to be classified as members of the HMM's protein family (See <a href="https://www.ncbi.nlm.nih.gov/genome/annotation_prok/evidence/example/">how to build an HMM</a>).
The HMMs included in the database encompass multiple collections.
<ul>
<li>NCBIFAMs: developed at NCBI, either de novo based on publications documenting protein function or from NCBI protein clusters (<a href="https://www.ncbi.nlm.nih.gov/pubmed/18940865">PRKs</a>)
<li><a href="https://www.ncbi.nlm.nih.gov/pubmed/18940865">TIGRFAMs</a>: created at The Institute for Genomic Research (now J. Craig Venter Institute) but now owned and maintained by NCBI
<li><a href="https://www.ncbi.nlm.nih.gov/pubmed/26673716">Pfams</a>: maintained and distributed by <a href="https://www.ebi.ac.uk/">EBI-EMBL</a>. NCBI expert curators may associate extra attributes that are not distributed in the EBI-EMBL Pfam releases such as product names, gene symbols or publications to the Entrez records.
</ul>
</div>
<div class='title'>Conserved domain (CDD) architectures</div><br>
<div>
<a href="https://www.ncbi.nlm.nih.gov/Structure/cdd/cdd.shtml">Conserved domain architectures</a> are protein classifiers built based on the nature and order of conserved domain signatures identified along protein sequences. Architectures with significant coverage are reviewed and given names, with an emphasis on architectures prominent in bacteria.
</div>
<br>
<div class='title'>BlastRules</div><br>
<div>
<a href="https://www.ncbi.nlm.nih.gov/pubmed/29112715">BlastRules</a> are a type of evidence for functional classification of proteins based on <a href="https://blast.ncbi.nlm.nih.gov/Blast.cgi">BLAST</a> (Basic Local Alignment Search Tool). A BlastRule consists of one or more 'model' proteins with known biological function, and BLAST identity and coverage cutoffs. Any protein aligning to a model protein above the cutoffs is considered a BlastRule hit. Curators review the literature to determine whether the biological function of studied proteins is conclusive and informative enough for creating a BlastRule. The protein sequences cited in articles are used as queries for BLAST searches in a database of proteins with known function. The identity and coverage cutoffs of the BlastRule are determined based on the BLAST results themselves, as well as phylogenetic analyses of the BLAST hits.
</div>
</body>
</html>
<br>
Revised 31 August 2023
</div>
</div>
<script src="//www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/slucore.min.js"></script>
<script src="//www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/infobox/infobox.min.js"></script>
<script src="//www.ncbi.nlm.nih.gov/Structure/shlu/jslibs/svg/svg.min.js"></script>
<script src="js/main.min.js"></script>
<script type='text/javascript' nonce='qRzoK/xtejHsZTMH3a2Hmw'>
function posObj(sheet, id, row, col, x, y) {
var rtl = false;
var sheetElement = document.getElementById(sheet);
if (!sheetElement) {
sheetElement = document.getElementById(sheet + '-grid-container');
}
if (sheetElement) {
rtl = sheetElement.getAttribute('dir') == 'rtl';
}
var r = document.getElementById(sheet+'R'+row);
var c = document.getElementById(sheet+'C'+col);
if (r && c) {
var objElement = document.getElementById(id);
var s = objElement.style;
var t = y;
while (r && r != sheetElement) {
t += r.offsetTop;
r = r.offsetParent;
}
var offsetX = x;
while (c && c != sheetElement) {
offsetX += c.offsetLeft;
c = c.offsetParent;
}
if (rtl) {
offsetX -= objElement.offsetWidth;
}
s.left = offsetX + 'px';
s.top = t + 'px';
s.display = 'block';
s.border = '1px solid #000000';
}
};
function posObjs() {
};
posObjs();
</script>
<!-- End of Real content-->
<div class="us">
<footer class="usa-footer usa-footer-big ncbi-footer" role="contentinfo">
<div class="usa-grid">
<div class="usa-row">
<nav class="usa-footer-nav">
<ul class="usa-unstyled-list usa-width-one-fourth usa-footer-primary-content">
<li class="usa-footer-primary-link ncbi-footer-heading">
<h4>Popular</h4>
</li>
<li><a href="https://www.ncbi.nlm.nih.gov/pubmed/">PubMed</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/pmc/">PMC</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/pubmedhealth/">PubMed Health</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/books/">Bookshelf</a></li>
<li><a href="https://pubchem.ncbi.nlm.nih.gov">PubChem</a></li>
<li><a href="https://blast.ncbi.nlm.nih.gov">BLAST</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/gene">Gene</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/nucleotide/">Nucleotide</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/protein/">Protein</a></li>
</ul>
<ul class="usa-unstyled-list usa-width-one-fourth usa-footer-primary-content">
<li class="usa-footer-primary-link ncbi-footer-heading"><h4>Connect</h4></li>
<li><a href="https://www.facebook.com/ncbi.nlm"><i class="fa fa-facebook fa-lg" aria-hidden="true"></i>Facebook</a></li>
<li><a href="https://twitter.com/ncbi"><i class="fa fa-twitter fa-lg" aria-hidden="true"></i>Twitter</a></li>
<li><a href="https://www.linkedin.com/company/national-center-for-biotechnology-information-ncbi-"><i class="fa fa-linkedin fa-lg" aria-hidden="true"></i>LinkedIn</a></li>
<li><a href="https://www.youtube.com/user/NCBINLM"><i class="fa fa-youtube fa-lg" aria-hidden="true"></i>YouTube</a></li>
<li><a href="https://github.com/ncbi"><i class="fa fa-github fa-lg" aria-hidden="true"></i>GitHub</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/news/announcements-list"><i class="fa fa-rss" aria-hidden="true"></i>News RSS</a></li>
<li><a href="https://ncbiinsights.ncbi.nlm.nih.gov/"><i class="fa fa-comments" aria-hidden="true"></i>Blog</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/about/contact.shtml"><i class="fa fa-envelope" aria-hidden="true"></i>Contact</a></li>
<li><a href="https://support.ncbi.nlm.nih.gov/"><i class="fa fa-question-circle" aria-hidden="true"></i>Support Center</a></li>
</ul>
<ul class="usa-unstyled-list usa-width-one-fourth usa-footer-primary-content">
<li class="usa-footer-primary-link ncbi-footer-heading"><h4>Resources</h4></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/literature.shtml">Literature</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/health.shtml">Health</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/genomes.shtml">Genomes</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/genes.shtml">Genes</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/proteins.shtml">Proteins</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/chemicals.shtml">Chemicals</a></li>
</ul>
<ul class="usa-unstyled-list usa-width-one-fourth usa-footer-primary-content">
<li class="usa-footer-primary-link ncbi-footer-heading"><h4>Actions</h4></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/submit.shtml">Submit</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/download.shtml">Download</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/learn.shtml">Learn</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/develop.shtml">Develop</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/home/analyze.shtml">Analyze</a></li>
<li><a href="https://www.ncbi.nlm.nih.gov/research/">Research</a></li>
</ul>
</nav>
<div class="usa-footer-logo usa-width-one-half">
<h3 class="ncbi"><a href="https://www.ncbi.nlm.nih.gov/">National Center for Biotechnology Information</a></h3>
<address>
<span class="h-adr">
<span class="p-street-address">8600 Rockville Pike</span>,
<span class="p-locality">Bethesda</span>
<span class="p-region"> MD</span>,
<span class="p-postal-code">20894</span>
<span class="p-country-name">USA</span>
</span>
</address>
</div>
</div>
</div>
<div class="usa-grid">
<div class="usa-row">
<div class="usa-width-one-half">
<div class="org-section">
<a href="https://www.hhs.gov/"><img class="usa-footer-logo-img hhs-logo" src="https://www.ncbi.nlm.nih.gov/Structure/sparcle/uswds/resources/dhhs-logo-white.svg" width="82%" height="82%" alt="U.S. Department of Health &amp; Human Services">
<span class="usa-sr-only">Department of Health and Human Services</span>
</a>
<a href="https://www.nih.gov/"><img class="usa-footer-logo-img nih-logo" src="https://www.ncbi.nlm.nih.gov/Structure/sparcle/uswds/resources/nih-logo-white.svg" width="82%" height="82%" alt="National Institutes of Health">
<span class="usa-sr-only">National Institutes of Health</span>
</a>
<a href="https://www.nlm.nih.gov/"><img class="usa-footer-logo-img nlm-logo" src="https://www.ncbi.nlm.nih.gov/Structure/sparcle/uswds/resources/nlm-logo-letters-white.svg" width="82%" height="82%" alt="National Library of Medicine">
<span class="usa-sr-only">National Library of Medicine</span>
</a>
<a href="https://www.usa.gov/"><img class="usa-footer-logo-img usagov-logo" src="https://www.ncbi.nlm.nih.gov/Structure/sparcle/uswds/resources/usagov-logo-white.svg" width="82%" height="82%" alt="USA.gov">
<span class="usa-sr-only">USA.gov</span></a>
</div>
</div>
<div class="usa-width-one-half">
<p class="about-links">
<a href="https://www.ncbi.nlm.nih.gov/home/about/">About NCBI</a>
<a href="https://www.ncbi.nlm.nih.gov/home/about/policies.shtml">Polices and Guidelines</a>
</p>
</div>
</div>
</div>
</footer>
</div>
<!--uswds header start-->
<script src="/Structure/shlu/jslibs/uswds/uswds.min.js"></script>
<script src="/Structure/shlu/jslibs/uswds/header.min.js"></script>
<!--uswds header end-->
<script src="/Structure/icn3d/lib/jquery-3.5.0.min.js"></script>
<script type="text/javascript">
$( document ).ready(function() {
$(document).on("click", ".mmdb-expand", function(e) {
e.stopImmediatePropagation();
var oriId = $(this).attr('id');
var pos = oriId.lastIndexOf('_');
var id = oriId.substr(0, pos);
$("#" + id).show();
$("#" + id + "_expand").hide();
$("#" + id + "_shrink").show();
});
$(document).on("click", ".mmdb-shrink", function(e) {
e.stopImmediatePropagation();
var oriId = $(this).attr('id');
var pos = oriId.lastIndexOf('_');
var id = oriId.substr(0, pos);
$("#" + id).hide();
$("#" + id + "_expand").show();
$("#" + id + "_shrink").hide();
});
});
</script>
</body>
</html>