nih-gov/www.ncbi.nlm.nih.gov/tools/cobalt/index.html

403 lines
25 KiB
HTML

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<meta name="ncbi_app" content="cobalt" />
<meta name="ncbi_pdid" content="blastsearch" />
<meta name="ncbi_program" content="" />
<meta name="referrer" content="origin-when-cross-origin" />
<meta name="ncbi_sessionid" content="CE8B5AF87C7FFCB1_0191SID" />
<meta name="ncbi_phid" content="0751F75D7D2148C10000000000000001" />
<script type="text/javascript"> var ncbi_startTime = new Date(); </script>
<title>COBALT:Multiple Alignment Tool</title>
<!-- style -->
<link rel="stylesheet" type="text/css" href="css/common.css" media="screen" />
<link rel="stylesheet" type="text/css" href="css/searchForm.css" media="screen" />
<!--[if IE]>
<link rel="stylesheet" type="text/css" href="css/searchFormIE.css" media="screen" />
<![endif]-->
<!--[if IE 8]>
<link rel="stylesheet" type="text/css" href="css/searchFormIE8.css" media="screen" />
<![endif]-->
<!--[if lte IE 6]>
<link rel="stylesheet" type="text/css" href="css/ie6_or_less.css" />
<![endif]-->
<!-- behavior -->
<!-- Not currently using ie7 JS script, because it causes a JS error -->
<!-- [if lt IE 7]>
<script src="https://nihms.nih.gov/db/ie7-standard-p.js" type="text/javascript"></script>
<![endif]-->
<!-- js files for title filling -->
<script type="text/javascript" src="/core/jig/1.15.2/js/jig.min.js"></script>
<script type="text/javascript"> jQuery.getScript("/core/alerts/alerts.js", function() {
galert(['div#header', 'body > *:nth-child(1)'])
});</script>
<link rel="stylesheet" type="text/css" href="css/header.css" media="screen" />
<link rel="stylesheet" type="text/css" href="css/google-fonts.css" media="screen" />
<link rel="stylesheet" type="text/css" href="css/footer.css" media="screen" />
<script type="text/javascript" src="js/utils.js"></script>
<script type="text/javascript" src="js/toggle.js"></script>
<script type="text/javascript" src="js/genericMln.js"></script>
<script type="text/javascript" src="js/multiAlign.js"></script>
</head>
<body id="type-a" class="">
<header id="page_header" role="banner">
<ul class="skip_nav">
<li><a accesskey="1" title="NCBI Homepage" href="https://www.ncbi.nlm.nih.gov/">NCBI Home</a></li>
<li><a accesskey="2" title="MyNCBI" href="https://www.ncbi.nlm.nih.gov/myncbi">Sign in to NCBI</a></li>
<li><a accesskey="3" title="Skip to main content" href="#content">Skip to Main Content</a></li>
<li><a accesskey="4" title="Skip to navigation" href="#navcontent">Skip to Navigation</a></li>
<li><a accesskey="0" title="About NCBI Accesskeys" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#accesskeys">About NCBI Accesskeys</a></li>
</ul>
<nav class="blue_nav_bar">
<div class="nih">
<a id="page_header_6" href="https://www.nih.gov/" class="left norm_height">
<img src="css/images/nih_logo.svg" alt="NIH logo" class="left"/></a>
<a id="page_header_7" href="https://www.nlm.nih.gov/" class="left header_link">U.S. National Library of Medicine</a>
</div>
<div class="left">
<img src="css/images/arrow.svg" class="left norm_height" alt=""/>
</div>
<div class="ncbi">
<a id="page_header_8" href="https://www.ncbi.nlm.nih.gov/" class="header_link">
<span class="ncbi_name">NCBI</span>
<span class="med_hidden">National Center for Biotechnology Information</span></a>
<div class="right sign-in">
<ul class="myncbi2">
<li id="myncbiusername">
<span id="mnu">
<a id="mnu_0" href="https://www.ncbi.nlm.nih.gov/account/settings/" title="Edit account settings"></a>
</span>
</li>
<li id="myncbi"><a id="myncbi_0" href="https://www.ncbi.nlm.nih.gov/myncbi/">My NCBI</a></li>
<li id="myncbi_sign_in"><a id="myncbi_sign_in_0" href="https://www.ncbi.nlm.nih.gov/account/?back_url=https%3A%2F%2Fwww%2Encbi%2Enlm%2Enih%2Egov%2Ftools%2Fcobalt%2F">Sign in to NCBI</a></li>
<li id="myncbi_register"><a id="myncbi_register_0" href="https://www.ncbi.nlm.nih.gov/account/register/?back_url=https%3A%2F%2Fwww%2Encbi%2Enlm%2Enih%2Egov%2Ftools%2Fcobalt%2F">Register</a></li>
<li id="myncbi_sign_out"><a id="myncbi_sign_out_0" href="https://www.ncbi.nlm.nih.gov/account/signout/?back_url=https%3A%2F%2Fwww%2Encbi%2Enlm%2Enih%2Egov%2Ftools%2Fcobalt%2F">Sign Out</a></li>
</ul>
</div>
</div>
</nav>
<div class="bg-gray header-div">
<nav class="top-nav" id="navcontent" role="navigation">
<a class="lf" href="cobalt.cgi?CMD=Web">COBALT</a> <span id="brc">Constraint-based Multiple Alignment Tool</span>
<div class="rf">
<ul id="blnav">
<li class="first active"><a href="cobalt.cgi?CMD=Web">Home</a></li>
<li class="recent "><a href="cobalt.cgi?CMD=RecentRes">Recent Results</a></li>
<li class="recent "><a href="cobalt.cgi?CMD=Doc">Help</a></li>
</ul>
</div>
</nav>
</div>
</header>
<div id="wrap">
<div id="content-wrap">
<!--<span class="pgt">Cobalt Constraint-based Multiple Protein Alignment Tool</span>-->
<div id="content">
<!-- Do errors this way -->
<ul id="msg" class="msg"><li class=""></li></ul>
<form name="searchForm" enctype="multipart/form-data" action="cobalt.cgi?CMD=submit" method="post" class="f-wrap-1" id="searchForm" >
<!-- <FORM name="searchForm" action="?request=page&seqList=true&seqType=Protein&submitRequest=on&dispAlignsID=0" method=post class="f-wrap-1" id="searchForm" > -->
<div id="progDescr">
COBALT computes a multiple protein sequence alignment using conserved domain and local sequence similarity information.
<a href="#" title="help" class="helplink showing" id="moreHelp"><span>[?]</span></a>
</div>
<div id="pagelinks"><a href="#" id="resetlink" resetform="searchForm">Reset page</a></div>
<div class="helpbox hidden" id="mhlp" toggle="moreHelp">
COBALT is a multiple sequence alignment tool that finds a collection of pairwise constraints derived from conserved domain database, protein motif database, and sequence similarity, using RPS-BLAST, BLASTP, and PHI-BLAST.
<br />
Pairwise constraints are then incorporated into a progressive multiple alignment.
<br />
More details in <a href="https://www.ncbi.nlm.nih.gov/pubmed/17332019">Papadopoulos JS and Agarwala R,
Bioinformatics 23:1073-79, 2007 (PMID: 17332019)</a>
</div>
<div id="query" class="section">
<fieldset class="section">
<legend>Enter Query Sequences</legend>
<div class="qs">
<div class="formblock all" id="qseq">
<label for="seq">Enter at least 2 protein accessions, gis, or FASTA sequences</label>
<a class="helplink hiding" title="help" href="#" id="queryHelp"><span>[?]</span></a>
<a href="#" class="clearlink" fieldToClear="seq" id="clearseq">Clear</a>
<div toggle="queryHelp" class="helpbox hidden" id="hq">
Query sequences to be aligned should be pasted in the text area.
It automatically determines the format or the input. To allow this feature there
are certain conventions required with regard to the input of identifiers.
<a href="https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&amp;PAGE_TYPE=BlastDocs&amp;DOC_TYPE=BlastHelp" target="helpWin" class="helplink">more...</a>
</div>
<textarea id="seq" class="reset" rows="6" cols="96" name="seqsToAlignFastA" ></textarea>
<br />
<label for="upl" class="m" >Or, upload FASTA file</label>
<div class="input ">
<input type="file" id="upl" name="fileSeqsToAlignFastA" />
</div>
<label for="jt" class="m" >Job Title</label>
<div class="input ">
<input type="text" id="jt" size="63" value="" name="jobTitle" />
</div>
</div> <!-- qseq -->
</div><!-- /.qs -->
</fieldset>
</div> <!-- query -->
<div class="searchInfo ">
<div class="summary">
<img border="0" id="b1" src="css/images/align.jpg" class="alnbutton" alt="Align" mouseovImg="css/images/alignOver.jpg" mouseoutImg="css/images/align.jpg" mousedownImg="css/images/alignDown.jpg" mouseupImg="css/images/alignOver.jpg" />
</div>
<div class="searchsummary">
<div class="openNewWin ">
<input class="newwin" type="checkbox" name="NEWWIN" id="nw1" form="searchForm" winType="random" />
<label class="inlineLabel " for="nw1">Show results in a new window</label>
</div>
</div>
</div>
<div class="" id="optSection">
<div id="sopts" class="section">
<a href="#i" class="arrowlink hiding moreOptions" id="toggleOptions">Advanced parameters</a>
<div id="moreopts" toggle="toggleOptions" class="hidden">
<fieldset class="section">
<legend>Alignment Parameters</legend>
<label for="GOP" class="m ">Gap Penalties</label>
<div class="input ">
<div class=" infl">
<label for="GOP">Opening</label>
<label for="GEP" class="lbLm">Extension</label>
</div>
<input name="gapOpenPenalty" id="GOP" type="text" size="5" value="-11" />
<input name="gapExtendPenalty" id="GEP" type="text" size="5" value="-1" class="rs" />
<a class="helplink" title="help" href="#" id="gopHelp"><span>[?]</span></a>
<p toggle="gopHelp" class="helpbox hidden">
Gap opening penalty and gap extension penalty for gaps inside of a sequence used in pairwise global alignment
in the progressive alignment stage.
</p>
</div>
<label for="EGOP" class="m ">End-Gap Penalties</label>
<div class="input ">
<div class=" infl">
<label for="EGOP">Opening</label>
<label for="EGEP" class="lbLm">Extension</label>
</div>
<input name="endGapOpenPenalty" id="EGOP" type="text" size="5" value="-5" />
<input name="endGapExtendPenalty" id="EGEP" type="text" size="5" value="-1" class="rs" />
<a class="helplink" title="help" href="#" id="egopHelp"><span>[?]</span></a>
<p toggle="egopHelp" class="helpbox hidden">
Gap opening penalty and gap extension penalty for gaps at ends of a sequence used in pairwise global alignment
in the progressive alignment stage.
</p>
</div>
</fieldset>
<fieldset class="section">
<legend>Constraint Parameters</legend>
<label for="URB" class="m ">RPS blast</label>
<div class="input">
<input name="useRPSBlast" type="checkbox" checked="checked" class="reset" id="URB" />
<label class="right inlinelabel" for="URB">Use RPS BLAST to guide alignment</label>
<a class="helplink" title="help" href="#" id="urbHelp"><span>[?]</span></a>
<p toggle="urbHelp" class="helpbox hidden">
Use RPS-BLAST to find conserved domains in query sequences to guide alignment. The sequence matches to conserved
domains will be converted into pair wise alignment constraints. Ranges of input sequences that match to the same
conserved domain will be aligned to each other in the final multiple alignment. We strongly recommend checking
this box. <br />
This box can be unchecked in order to decrease computation time if all sequences are expected to match to the
same conserved domains or not to match to any conserved domain. COBALT is optimized for cases where groups of
sequences do match to the same domain (see <i>Query Clustering</i> below). <br />
<b>Note:</b> Unchecking this box in other cases will result in poorer alignment.
</p>
</div>
<label for="BE" class="m ">Constraint E-value</label>
<div class="input ">
<input name="blastEvalue" id="BE" type="text" size="5" value="0.005" />
<a class="helplink" title="help" href="#" id="beHelp"><span>[?]</span></a>
<p toggle="beHelp" class="helpbox hidden">
E-value threshold for accepting BLAST-P hits in pair wise local alignment of input sequences. The accepted
matches will be converted into pair wise alignment constraints. Pair wise locally aligned ranges of input
sequences will be aligned to one another in the multiple alignment. E-value can be increased if very dissimilar
sequences are used. <br />
<b>Note:</b> Changing this value can significantly impact quality of the resulting alignment.
</p>
</div>
<label for="FCC" class="m ">Conserved columns</label>
<div class="input">
<input name="findConservedCols" type="checkbox" checked="checked" class="reset" id="FCC" />
<label class="right inlinelabel" for="FCC">Find Conserved Columns and Recompute Alignment</label>
<a class="helplink" title="help" href="#" id="fccHelp"><span>[?]</span></a>
<p toggle="fccHelp" class="helpbox hidden">
Identify conserved columns after the first iteration of progressive alignment and re-align input sequences using
this information. Unchecking this box will reduce computation time but will also result in poorer alignment
(especially if <i>Use query clusters</i> box is checked). We strongly recommend checking this box.
</p>
</div>
</fieldset>
<fieldset class="section">
<legend>Query Clustering Parameters</legend>
<label for="UQC" class="m ">Query Clustering Parameters</label>
<div class="input">
<input name="useQueryClusters" type="checkbox" checked="checked" class="reset" id="UQC" />
<label class="right inlinelabel" for="UQC">Use query clusters</label>
<a class="helplink" title="help" href="#" id="uqcHelp"><span>[?]</span></a>
<p toggle="uqcHelp" class="helpbox hidden">
Reduce computation time by using clusters of similar sequences. The idea behind using clusters is that constraints
do not contribute information for alignment of very similar sequences. Then computationally intensive tasks
of identifying conserved domains and consistent set of constraints can be avoided for many sequences. Clusters of
similar sequences are found using alignment-free k-mer counting-based method. See Edgar RC, <i>Nucleic Acids Res</i>
16:380-5, 2004, <i>PMID: 14729922</i> for k-mer counting-based sequence similarity.
Constraints will be computed only for cluster representatives. In-cluster sequences will be aligned using combined
local and global alignment. We recommend that the <i>Find Conserved Columns and Recompute Alignment</i> option (above) is
also selected.
We recommend using this option for aligning BLAST results and whenever a subset of input sequences that
share conserved domains is expected.
This option can be unchecked for aligning of sequences that are not expected to share conserved domains and are
expected to have very short pair wise local alignments.
</p>
</div>
<label for="WS" class="m ">Word Size</label>
<div class="input ">
<select name="wordSize" id="WS">
<option value="3" >3</option>
<option value="4" selected="selected" >4</option>
<option value="5" >5</option>
<option value="6" >6</option>
<option value="7" >7</option>
</select>
<a class="helplink" title="help" href="#" id="wsHelp"><span>[?]</span></a>
<p toggle="wsHelp" class="helpbox hidden">
Number of letters in a word (k-mer) for k-mer count-based sequence similarity computation. Smaller words will
make sequences more similar than larger words.
</p>
</div>
<label for="MCD" class="m ">Max Cluster distance</label>
<div class="input ">
<select name="maxClusterDist" id="MCD">
<option value="0.6" >0.6</option>
<option value="0.65" >0.65</option>
<option value="0.7" >0.7</option>
<option value="0.75" >0.75</option>
<option value="0.8" selected="selected" >0.8</option>
<option value="0.85" >0.85</option>
<option value="0.9" >0.9</option>
<option value="0.95" >0.95</option>
</select>
<a class="helplink" title="help" href="#" id="mcdHelp"><span>[?]</span></a>
<p toggle="mcdHelp" class="helpbox hidden">
Maximum allowed distance between two sequences in a cluster. This threshold prvents COBALT from forming clusters
o unrelated sequences.
The distance between two sequences is computed as a fraction of words that appear in both sequences with respect
to number of all words in the longer sequence (similarly as in Edgar RC, <i>Nucleic Acids Res</i>
16:380-5, 2004, <i>PMID: 14729922</i>).
This distance overestimates exponentially scaled percentage of different residues in aligned sequences (see graphs
in the above paper for details).
Allowed range for this threshold is between 0 and 1. Smaller values result in more clusters and hence more
conserved domain-based constraints used in multiple alignment. Larger values result in fewer clusters and
hence less conserved domain information used in multiple alignment.
</p>
</div>
<label for="ALPH" class="m ">Alphabet</label>
<div class="input ">
<select name="alphabet" id="ALPH" class="reset">
<option value="2" selected="selected" >SE-B15</option>
<option value="1" >SE-V10</option>
<option value="0" >Regular</option>
</select>
<a class="helplink" title="help" href="#" id="alphHelp"><span>[?]</span></a>
<div toggle="alphHelp" class="helpbox hidden">
Alphabet for creating k-mer count representations of sequences.
Available options:
<ul>
<li>SE-B15 and SE-V10 - 15 and 10-letter compressed alphabets (see Shiryev SA et al.,
Bioinformatics 23:2949-51, 2007, <i>PMID: 17921491</i> for details)</li>
<li>Regular - regular 20-amino-acid alphabet.</li>
</ul>
</div>
</div>
</fieldset>
<div class="searchInfo ">
<div class="summary">
<img border="0" id="b2" src="css/images/align.jpg" class="alnbutton" alt="Align" mouseovImg="css/images/alignOver.jpg" mouseoutImg="css/images/align.jpg" mousedownImg="css/images/alignDown.jpg" mouseupImg="css/images/alignOver.jpg" />
</div>
<div class="searchsummary">
<div class="openNewWin ">
<input class="newwin" type="checkbox" name="NEWWIN" id="nw2" form="searchForm" winType="random" />
<label class="inlineLabel " for="nw2">Show results in a new window</label>
</div>
</div>
</div>
</div><!-- moreopts -->
</div>
</div>
<input name="distanceMethod" value="0" type="hidden" />
<!-- <input name="inputScreen" value="true" type="hidden" />
<input name="AlignSeqs" value="" id="AlignSeqs" type="hidden" /> -->
<input name="link_loc" type="hidden" value="cobaltInpPage"/>
</form>
</div><!--/#content-->
<div id="footer">
<div id="rgs">BLAST is a registered trademark of the National Library of Medicine.</div>
<p id="orgns">
<a href="https://www.ncbi.nlm.nih.gov/" title="National Center for Biotechnology Information">NCBI</a> |
<a href="https://www.nlm.nih.gov/" title="National Library of Medicine">NLM</a> |
<a href="https://www.nih.gov/" title="National Institutes of Health">NIH</a> |
<a href="https://www.hhs.gov/" title="US Department of Health and Human Services">DHHS</a>
</p>
<p>
<a href='https://www.ncbi.nlm.nih.gov/About/disclaimer.html'
title='NCBI intellectual property statement'>Copyright</a> |
<a href='https://www.ncbi.nlm.nih.gov/About/disclaimer.html#disclaimer'
title='About liability, endorsements, external links, pop-up advertisements'>Disclaimer</a> |
<a href='https://www.nlm.nih.gov/privacy.html'
title='NLM privacy policy'>Privacy</a> |
<a href='https://www.nlm.nih.gov/accessibility.html'
title='About using NCBI resources with assistive technology'>Accessibility</a> |
<a href='https://www.ncbi.nlm.nih.gov/About/glance/contact_info.html'
title='How to get help, submit data, or provide feedback'>Contact</a> |
<a href='https://www.ncbi.nlm.nih.gov/sites/ehelp/feedback?Ncbi_App=blast'
title='How to get help, submit data, or provide feedback'>Send feedback</a>
</p>
</div>
<script type="text/javascript" src="js/header.js"> </script>
</div><!--/#content-wrap-->
</div><!--/#wrap-->
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js"></script>
</body>
</html>