nih-gov/www.ncbi.nlm.nih.gov/sra/docs/sra-aws-download/index.html

708 lines
44 KiB
HTML

<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<!-- AppResources meta begin -->
<meta name="paf-app-resources" content="" />
<!-- AppResources meta end -->
<!-- TemplateResources meta begin -->
<meta name="paf_template" content="StdNCol" />
<!-- TemplateResources meta end -->
<!-- Page meta begin -->
<!-- Page meta end -->
<!-- Logger begin -->
<meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_app" content="sra" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_pdid" content="sra-custom-page" />
<!-- Logger end -->
<title>Download SRA sequence data using Amazon Web Services (AWS)</title>
<!-- PageFixtures headcontent begin -->
<meta name="cms-local-nav-url" content="https://cms.ncbi.nlm.nih.gov//sra/docs/sratabnav" />
<!-- PageFixtures headcontent end -->
<!-- AppResources external_resources begin -->
<script type="text/javascript" src="/core/jig/1.14.8/js/jig.min.js"></script>
<!-- AppResources external_resources end -->
<!-- Page headcontent begin -->
<meta name="subsite" content="sra" />
<meta name="path" content="sra/docs/sra-aws-download" />
<meta name="modified" content="2023-07-12T17:46:09Z" />
<link type="text/css" rel="stylesheet" href="/core/assets/sra/css/SraDoc.css" />
<!-- Page headcontent end -->
<!-- PageFixtures resources begin -->
<link xmlns="http://www.w3.org/1999/xhtml" type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218191/css/4207974/4206132.css" xml:base="http://127.0.0.1/sites/static/header_footer" />
<!-- PageFixtures resources end -->
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8CA5AD7D1FE9D100000000013B0116.m_6" />
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4217302/css/4121862/3974050/3917732/251717/4082496/14534/45193/3534283/4128070/4082512/4005757/4062871.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4217302/css/3529741/3529739.css" media="print" /></head>
<body class=" sra-custom-page">
<div class="grid">
<div class="col twelve_col nomargin shadow">
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
<div class="sysmessages">
<noscript>
<p class="nojs">
<strong>Warning:</strong>
The NCBI web site requires JavaScript to function.
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
</p>
</noscript>
</div>
<!--/.sysmessage-->
<div class="wrap">
<div class="page">
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" id="universal_header" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="usa-banner">
<div class="usa-accordion">
<header class="usa-banner-header">
<div class="usa-grid usa-banner-inner">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
<p>An official website of the United States government</p>
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
<span class="usa-banner-button-text">Here's how you know</span>
</button>
</div>
</header>
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
<div class="usa-banner-guidance-gov usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
<div class="usa-media_block-body">
<p>
<strong>The .gov means it's official.</strong>
<br />
Federal government websites often end in .gov or .mil. Before
sharing sensitive information, make sure you're on a federal
government site.
</p>
</div>
</div>
<div class="usa-banner-guidance-ssl usa-width-one-half">
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
<div class="usa-media_block-body">
<p>
<strong>The site is secure.</strong>
<br />
The <strong>https://</strong> ensures that you are connecting to the
official website and that any information you provide is encrypted
and transmitted securely.
</p>
</div>
</div>
</div>
</div>
</section>
<div class="usa-overlay"></div>
<header class="ncbi-header" role="banner" data-section="Header">
<div class="usa-grid">
<div class="usa-width-one-whole">
<div class="ncbi-header__logo">
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
</a>
</div>
<div class="ncbi-header__account">
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
<span class="fa fa-user" aria-hidden="true">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
<g style="fill: #fff">
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
</g>
</svg>
</span>
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
<span class="sr-only">Show account info</span>
</button>
</div>
<div class="ncbi-popup-anchor">
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
<div class="ncbi-popup-head">
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
<span class="fa fa-times">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
</svg>
</span>
<span class="usa-sr-only">Close</span></button>
<h4>Account</h4>
</div>
<div class="account-user-info">
Logged in as:<br />
<b><span class="username" id="uname_long">username</span></b>
</div>
<div class="account-links">
<ul class="usa-unstyled-list">
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
</ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div role="navigation" aria-label="access keys">
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
</div>
<section data-section="Alerts">
<div class="ncbi-alerts-placeholder"></div>
</section>
</div>
</div>
<!--/.header-->
<div class="header">
<div class="res_logo"><h1 class="res_name"><a href="/sra/" title="SRA home">SRA</a></h1><h2 class="res_tagline">SRA</h2></div>
<div class="search"><form method="get" action="/sra/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="sra" selected="selected">SRA</option><option value="nuccore">Nucleotide</option><option value="books">Books</option><option value="pubmed" class="last">PubMed</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label for="term" 
class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search SRA" value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="isEnabled:false,disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'yes'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div></form><ul class=" inline_list searchlinks"><li>
<a href="/sra/advanced/">Advanced</a>
</li></ul></div>
</div>
<div class="nav_and_browser">
<div class="localnav"><ul class="jig-ncbilocalnav">
<li>
<a title="Getting Started" href="/sra/docs/">Getting Started</a></li>
<li>
<a title="SRA Submission Quick Start" href="/sra/docs/submit">Submission Quick Start</a></li>
<li>
<a title="SRA Search and Download Guide" href="/sra/docs/sradownload">Search and Download</a>
</li>
<li>
<a title="How to use SRA in the cloud" href="/sra/docs/sra-cloud">SRA in the Cloud</a>
</li>
<li>
<a title="Archive Documentation" href="/sra/docs/sra-data-storage-model/">Archive Documentation</a>
<ul>
<li><a title="Data Storage Model" href="/sra/docs/sra-data-storage-model/">Data Storage Model</a></li>
<li><a title="Root Cause Analysis: Summary and Report" href="/sra/docs/rca/">Root Cause Analysis: Summary and Report</a></li>
</ul>
</li>
</ul></div>
</div>
<!-- was itemctrl -->
<div class="container">
<div id="maincontent" class="content col twelve_col last">
<div class="col1">
<h1 id="download-sra-sequence-data-using">Download SRA sequence data using Amazon Web Services (AWS)</h1>
<div class="toc">
<ul>
<li><a href="#sra-data-in-the-aws-registry-of-">SRA Data in the AWS Registry of Open Data</a><ul>
<li><a href="#coronaviridae-datasets">Coronaviridae Datasets</a></li>
<li><a href="#public-data">Public data</a></li>
<li><a href="#public-usersubmitted-files">Public user-submitted files</a></li>
</ul>
</li>
<li><a href="#accessing-sra-data-in-aws">Accessing SRA Data in AWS</a></li>
<li><a href="#introduction-for-first-time-user">Introduction for First Time Users</a></li>
<li><a href="#creating-an-aws-instance">Creating an AWS Instance</a><ul>
<li><a href="#signin-and-enter-the-amazon-ec2-">Sign-in and Enter the Amazon EC2 Console</a></li>
<li><a href="#create-an-aws-instance">Create an AWS Instance</a></li>
<li><a href="#connect-to-the-instance">Connect to the Instance</a></li>
<li><a href="#terminate-the-instance">Terminate the Instance</a></li>
</ul>
</li>
<li><a href="#the-sra-toolkit-in-aws">The SRA Toolkit in AWS</a><ul>
<li><a href="#installing-the-sra-toolkit-in-yo">Installing The SRA Toolkit in your instance</a></li>
<li><a href="#using-the-sra-toolkit-in-aws">Using the SRA Toolkit in AWS</a></li>
</ul>
</li>
<li><a href="#youtube-video-tutorial-setting-u">YouTube Video Tutorial - Setting up AWS - demo</a></li>
<li><a href="#engage">Engage</a></li>
</ul>
</div>
<h2 id="sra-data-in-the-aws-registry-of-">SRA Data in the AWS Registry of Open Data</h2>
<p><a target="_blank" title="NCBI coronavirus data available on AWS, new window" href="https://aws.amazon.com/blogs/publicsector/taking-covid-strides-national-center-biotechnology-information-coronavirus-genomic-data-available-aws">Amazon Web Services publicly hosts SRA data<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>
through
the <a target="_blank" title="Registry of Open Data, new window" href="https://aws.amazon.com/opendata/open-data-sponsorship-program">Registry of Open Data<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>.
SRA has several datasets in the AWS Registry of
Open Data, all of which can be accessed freely, without charge, through either an HTTPS or S3 URL. One dataset contains public SRA
data in the originally submitted format from select high value and newly-released studies. The second dataset acts as a centralized repository of
SARS-CoV-2 related sequences submitted to NCBI. Included are both the original files submitted by the principal investigator as well as SRA-processed
sequences (including normalized sequence files and SRA
<a title="SRA aligned read format" href="/sra/docs/sra-aligned-read-format/">aligned read format</a> files) that require the
<a title="SRA Toolkit" href="https://github.com/ncbi/sra-tools/wiki/02.-Installing-SRA-Toolkit">SRA Toolkit</a> for analysis. This dataset also includes
metadata <a title="Search in Athena" href="/sra/docs/sra-athena/">searchable in AWS Athena</a>
by BLAST result, taxonomic analysis, and more, to allow rapid discovery of the most relevant data to your research. </p>
<h3 id="coronaviridae-datasets"><a target="_blank" title="Coronaviridae Datasets" href="https://registry.opendata.aws/ncbi-covid-19/">Coronaviridae Datasets<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a></h3>
<ul>
<li><strong>Runs</strong> directory contains normalized sequence data, accessible in multiple formats (fastq, sam, fasta) via the SRA Toolkit and organized by Run accession. </li>
<li><strong>sra-src</strong> directory contains the submitted sequence files in their original format, organized by Run accession. </li>
<li><strong>VCF</strong> directory contains SRA generated VCF files, organized by Run accession. </li>
</ul>
<p>AWS CLI Access (No AWS account required): </p>
<p><code>aws s3 ls s3://sra-pub-sars-cov2/ --no-sign-request</code> </p>
<h3 id="public-data"><a target="_blank" title="Public data" href="https://registry.opendata.aws/ncbi-sra/">Public data<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a></h3>
<ul>
<li>Contains all public SRA Runs organized by Run accession. </li>
</ul>
<p>AWS CLI Access (No AWS account required): </p>
<p><code>aws s3 ls s3://sra-pub-run-odp/ --no-sign-request</code> </p>
<h3 id="public-usersubmitted-files"><a target="_blank" title="Public submitted files" href="https://registry.opendata.aws/ncbi-sra/">Public user-submitted files<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a></h3>
<ul>
<li>Contains submitted sequence files in their original format, organized by Run accession. </li>
</ul>
<p>AWS CLI Access (No AWS account required): </p>
<p><code>aws s3 ls s3://sra-pub-src-2/ --no-sign-request</code> </p>
<h2 id="accessing-sra-data-in-aws">Accessing SRA Data in AWS</h2>
<p>If you know your Run accessions of interest, you can access the data in several ways.
To download files from the <a target="_blank" title="Amazon AWS Console, new window" href="https://aws.amazon.com/">AWS Console<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a> using a
browser, visit the HTTPS URL for the Coronaviridae dataset, Public SRA data, or Public user-submitted files respectively: </p>
<ul>
<li>https://s3.console.aws.amazon.com/s3/buckets/sra-pub-sars-cov2/ </li>
<li>https://s3.console.aws.amazon.com/s3/buckets/sra-pub-run-odp/ </li>
<li>https://s3.console.aws.amazon.com/s3/buckets/sra-pub-src-2/ </li>
</ul>
<p>From there you can navigate the directory structure using the provided graphical interface and you can
search a given directory for your accession of interest using the provided search box near the top of the page.
Once you have navigated to a specific file of interest you can click the <strong>Object URL</strong> link or use the <strong>Object actions</strong>
button to copy the file to your own S3 bucket or download a copy to local storage. </p>
<p>To access files from <em>within</em> AWS, e.g. from an EC2 instance, you can use the
<a target="_blank" title="AWS CLI, new window" href="https://aws.amazon.com/cli/">AWS CLI<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>
to perform an S3 copy or sync, using a command like this: </p>
<p><code>aws s3 cp s3://sra-pub-sars-cov2/README.txt $HOME/README.txt</code> </p>
<p>These data can also be accessed using various other
<a target="_blank" title="AWS tools and libraries, new window" href="https://docs.aws.amazon.com/AmazonS3/latest/dev/UsingAWSSDK.html">tools and libraries<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>.
Access to files in the
<a target="_blank" title="AWS Registry of Open Data, new window" href="https://aws.amazon.com/opendata/public-datasets/">AWS Registry of Open Data<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>
is free. This is true whether you use the HTTPS or S3 URL. For S3 URLs, the transfer is free even if it crosses an AWS region boundary; there is no
<a target="_blank" title="inter-regional data transfer fee, new window" href="https://aws.amazon.com/s3/pricing/">inter-regional data transfer fee<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>. </p>
<p>If you don't know the Run accessions you are interested in, you can start by searching in the
<a title="SRA Run Selector" href="/Traces/study/">SRA Run Selector</a>,<br />
<a target="_blank" title="AWS Athena - Youtube" href="https://www.youtube.com/watch?v=_F4FhcDWSJg">AWS Athena<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>, or
<a title="SRA Entrez" href="/sra">SRA Entrez</a>.<br />
A full list of Coronaviridae-containing SRA runs as detected with NCBI's kmer analysis tool is available here: <a title="SRA FTP: full list of Coronaviridae-containing SRA runs" href="https://ftp.ncbi.nlm.nih.gov/sra/reports/AccList/">https://ftp.ncbi.nlm.nih.gov/sra/reports/AccList/</a>. </p>
<h2 id="introduction-for-first-time-user">Introduction for First Time Users</h2>
<p><strong>Amazon Elastic Compute Cloud (EC2)</strong> is the Amazon Web Service you use to create and run virtual machines in the cloud.
AWS calls these virtual machines 'instances'.
You will need to install your bioinformatics tools for data analysis and the SRA Toolkit for accessing the SRA data. </p>
<h2 id="creating-an-aws-instance">Creating an AWS Instance</h2>
<p><img src="/core/assets/sra/images/znak.png" alt="Exclamation point" height="20" /> Users will need to address accounts on their own. <br />
Please work with your organization for credential and billing questions. If using a personal account, this guide attempts to stay within <strong>AWS Free Tier</strong> for users who are still eligible. </p>
<p><img src="/core/assets/sra/images/znak.png" alt="Exclamation point" height="20" /> Users of this guide are expected to have experience using a Unix command-line interface. </p>
<h3 id="signin-and-enter-the-amazon-ec2-">Sign-in and Enter the Amazon EC2 Console</h3>
<p>Sign-in using your AWS account: <a target="_blank" title="Amazon AWS Console, new window" href="https://aws.amazon.com/">Amazon AWS Console<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>. </p>
<h3 id="create-an-aws-instance">Create an AWS Instance</h3>
<p>Please follow this <a target="_blank" title="Amazon AWS guide, new window" href="https://docs.aws.amazon.com/efs/latest/ug/gs-step-one-create-ec2-resources.html">Amazon step-by-step guide<img src="/core/assets/sra/images/offsite.png" alt="offsite image" width="15" /></a>
that will help you launch a Linux virtual machine on Amazon EC2 within Amazon AWS Free Tier.<br />
Please make sure to create your EC2 instance in the <strong>US East (N. Virginia) us-east-1 region</strong>. </p>
<h3 id="connect-to-the-instance">Connect to the Instance</h3>
<p>Use either a Unix/OSX terminal or your preferred ssh application to connect, as described in the Amazon tutorial linked above.<br />
The username for this AMI is <strong>ec2-user</strong>. </p>
<h3 id="terminate-the-instance">Terminate the Instance</h3>
<ul>
<li>Remember to terminate the EC2 instance from the AWS console when you have finished using it. If you do not terminate the instance, charges can be generated on your account even when no users are connected. </li>
<li>Data stored on the EC2 instance will be deleted when the instance is terminated. Users will likely want to have stable S3 storage to store results from their work. </li>
</ul>
<h2 id="the-sra-toolkit-in-aws">The SRA Toolkit in AWS</h2>
<h3 id="installing-the-sra-toolkit-in-yo">Installing The SRA Toolkit in your instance</h3>
<p>Once you are connected, you will be able to work in a Unix-like command-line environment where you can install and configure the SRA Toolkit. </p>
<ul>
<li><a target="_blank" title="Installing the SRA Toolkit" href="https://github.com/ncbi/sra-tools/wiki/02.-Installing-SRA-Toolkit">Installing the SRA Toolkit</a> </li>
</ul>
<h3 id="using-the-sra-toolkit-in-aws">Using the SRA Toolkit in AWS</h3>
<ul>
<li>For downloading public SRA data from our cloud buckets to your cloud storage you can use the SRA Toolkit utilities as described in the <a title="SRA Download Guide" href="/sra/docs/sradownload">SRA Download Guide</a> </li>
<li>For downloading dbGaP data from our cloud buckets to your cloud storage you need to use the <strong>jwt.cart</strong> file as described in the <a title="Downloading dbGaP data with JWT" href="/sra/docs/sra-dbGAP-cloud-download">Downloading dbGaP data with JWT</a> </li>
</ul>
<p><span class="warning-message"><img src="/core/assets/sra/images/tack.png" alt="Tack" height="30" />Don't forget to STOP your instance after you have finished your work! </span> </p>
<h2 id="youtube-video-tutorial-setting-u">YouTube Video Tutorial - Setting up AWS - demo</h2>
<ul>
<li><a title="Setting up AWS demo" href="https://www.youtube.com/watch?v=rjjrHnZfymU">Setting up AWS demo</a> </li>
</ul>
<iframe src="https://www.youtube.com/embed/rjjrHnZfymU" width="647" height="364" title="How to Access SRA Data with Amazon Web Services" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture" allowfullscreen=""></iframe>
<h2 id="engage">Engage</h2>
<p>NCBI wants your feedback on SRA in the Cloud. Contact <a href="mailto:sra@ncbi.nlm.nih.gov?subject=SRA%20question&amp;body=Dear%20SRA%20staff">sra@ncbi.nlm.nih.gov</a> with questions or if you would like to provide input on new functionality.</p>
</div>
<!--/.col1-->
<div class="col2">
<div id="shared-content-1">
<h2 data-heading="h2" data-no-toc="true">Getting Started</h2>
<ul>
<li><a title="SRA Getting Started" href="/sra/docs/">Getting Started</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">Cloud Quick Start</h2>
<ul>
<li><a title="SRA Cloud getting started" href="/sra/docs/sra-cloud">Cloud Introduction</a> </li>
<li><a target="_blank" title="SRA on YouTube: Tutorials" href="https://www.youtube.com/playlist?list=PL7dF9e2qSW0ZZci13mHSKZYis3MV4Mdoa">YouTube Tutorials</a> </li>
<li><a title="GCP SARS-CoV-2 Public Dataset Guide" href="/sra/docs/gcp-pdp-guide">GCP SARS-CoV-2 Public Dataset Guide</a> </li>
<li><a title="SRA Cloud Access Costs" href="/sra/docs/sra-cloud-access-costs">SRA Cloud Access Costs</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">Setting Up</h2>
<ul>
<li><a title="SRA Google Cloud" href="/sra/docs/SRA-Google-Cloud">Set up Google Cloud</a> </li>
<li><a title="SRA Amazon Cloud" href="/sra/docs/sra-aws-download/">Set up Amazon Cloud</a> </li>
<li><a title="SRA in BigQuery" href="/sra/docs/sra-bigquery">Set up BigQuery</a> </li>
<li><a title="SRA in Athena" href="/sra/docs/sra-athena">Set up Athena</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">Cloud Data Access</h2>
<ul>
<li><a title="Download SRA sequences from Entrez search results" href="/sra/docs/sradownload">Download Guide</a> </li>
<li><a title="Data Delivery to cloud bucket" href="/sra/docs/data-delivery">Cloud Data Delivery Service</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">Accessing dbGAP</h2>
<ul>
<li><a title="Download dbGAP from cloud" href="/sra/docs/sra-dbGAP-cloud-download">Download dbGAP with JWT</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">Search</h2>
<ul>
<li><a title="SRA cloud-based search" href="/sra/docs/sra-cloud-based-examples">Cloud-based Search</a> </li>
<li><a title="SRA in BigQuery" href="/sra/docs/sra-bigquery-examples">Search in BigQuery</a> </li>
<li><a title="SRA in Athena" href="/sra/docs/sra-athena-examples">Search in Athena</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">SRA Analysis</h2>
<ul>
<li><a title="SRA Aligned Read Format" href="/sra/docs/sra-aligned-read-format">SRA Aligned Read Format</a> </li>
<li><a title="SRA SARS-CoV-2 Detection Tool" href="/sra/docs/sra-detection-tool">SARS-CoV-2 Detection Tool</a> </li>
<li><a title="SARS-CoV-2 Variant Calling" href="/sra/docs/sars-cov-2-variant-calling">SARS-CoV-2 Variant Calling</a> </li>
<li><a title="SRA Taxonomy Analysis Tool" href="/sra/docs/sra-taxonomy-analysis-tool">SRA Taxonomy Analysis Tool</a> </li>
</ul>
<h2 data-heading="h2" data-no-toc="true">SRA Data Formats</h2>
<ul>
<li><a title="SRA Data Formats" href="/sra/docs/sra-data-formats">SRA Data Formats</a> </li>
<li><a title="Data Format FAQ" href="/sra/docs/data-format-faq">Data Format FAQ</a> </li>
</ul>
</div>
</div>
<!--/.col2-->
<div class="col3">
</div>
<!--/.col3-->
<div class="col4">
</div>
<!--/.col4-->
<div class="col5">
</div>
<div class="col6">
</div>
<div class="col7">
</div>
<div class="col8">
</div>
<div class="col9">
</div>
</div><!--/.content-->
</div><!--/.container-->
<div id="NCBIFooter_dynamic">
<div class="breadcrumbs">You are here:
<span id="breadcrumb_text"><a href="/guide/">NCBI</a></span></div>
<a id="help-desk-link" class="help_desk" href="https://support.ncbi.nlm.nih.gov/ics/support/default.asp?Time=2025-03-12T19:01:34-04:00&amp;Snapshot=%2Fprojects%2Fstaticsites%2FSraDocs@1.5&amp;Host=portal105&amp;ncbi_phid=CE8CA5AD7D1FE9D100000000013B0116&amp;ncbi_session=CE8B5AF87C7FFCB1_0191SID&amp;from=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fsra%2Fdocs%2Fsra-aws-download%2F&amp;Ncbi_App=sra&amp;Page=sra-custom-page&amp;style=classic&amp;deptID=28049" target="_blank">Support Center</a>
<noscript><img alt="" src="/stat?jsdisabled=true&amp;ncbi_app=sra&amp;ncbi_db=&amp;ncbi_pdid=sra-custom-page&amp;ncbi_phid=CE8CA5AD7D1FE9D100000000013B0116" /></noscript>
</div>
<div xmlns:xi="http://www.w3.org/2001/XInclude">
<div xmlns="http://www.w3.org/1999/xhtml" class="footer" id="footer" xml:base="http://127.0.0.1/sites/static/header_footer">
<section class="icon-section">
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
<div class="grid-container container">
<div class="icon-section_container">
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
<svg xmlns="http://www.w3.org/2000/svg" width="40" height="40" viewBox="0 0 40 40" fill="none">
<title>Twitter</title>
<g id="twitterx1008">
<path id="path1008" d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z" fill="#5B616B"></path>
</g>
</svg>
</a>
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>Facebook</title>
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
<title>LinkedIn</title>
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
</path>
</svg></a>
<a class="footer-icon" id="footer_github"
   href="https://github.com/ncbi"
   aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 300 300" data-name="Layer 1">
  <defs>
    <!-- These class rules apply document-wide, not just to this SVG; the
         LinkedIn footer icon's path also carries class cls-11. -->
    <style>
      .cls-11, .cls-12 { fill: #737373; }
      .cls-11 { fill-rule: evenodd; }
    </style>
  </defs>
  <title>GitHub</title>
  <!-- Main logo outline (cls-11: grey fill, even-odd fill rule). -->
  <path class="cls-11"
        d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z" />
  <!-- Remaining paths (cls-12: grey fill only). -->
  <path class="cls-12"
        d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1" />
  <path class="cls-12"
        d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08" />
  <path class="cls-12"
        d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0" />
  <path class="cls-12"
        d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0" />
  <path class="cls-12"
        d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0" />
  <path class="cls-12"
        d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0" />
  <path class="cls-12"
        d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0" />
</svg></a>
<!-- Icon-only link to the NCBI Insights blog. The aria-label supplies the
     link's accessible name and takes precedence over the SVG <title>, so it
     names the blog in full rather than the generic "Blog". -->
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="NCBI Insights Blog">
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
<defs><style>.cls-1{fill:#737373;}</style></defs>
<title>NCBI Insights Blog</title>
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
</svg>
</a>
</div>
</div>
</section>
<section class="container-fluid bg-primary">
<div class="container pt-5">
<div class="row mt-3">
<div class="col-lg-3 col-12">
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
<ul class="list-inline social_media">
<li class="list-inline-item"><a
    href="https://twitter.com/NLM_NIH"
    target="_blank" rel="noopener noreferrer"
    aria-label="Twitter">
  <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 36 35" width="35" height="35" fill="none">
    <title>Twitter</title>
    <!-- Icon artwork, clipped to the 35x35 rectangle declared in <defs> below. -->
    <g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
      <!-- Blue disc with a white outline. -->
      <path id="Vector_Twitter"
            d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z"
            fill="#205493" stroke="white" stroke-width="1.0" stroke-miterlimit="10" />
      <!-- White glyph drawn on top of the disc. -->
      <path id="path1009"
            d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z"
            fill="white" />
    </g>
    <defs>
      <clipPath id="clip0_65276_3946">
        <rect width="35" height="35" fill="white" />
      </clipPath>
    </defs>
  </svg>
</a></li>
<li class="list-inline-item"><a
    href="https://www.facebook.com/nationallibraryofmedicine"
    target="_blank" rel="noopener noreferrer"
    aria-label="Facebook">
  <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 36 35" width="35" height="35" fill="none">
    <title>Facebook</title>
    <!-- Icon artwork, clipped to the 35x35 rectangle declared in <defs> below. -->
    <g id="Facebook" clip-path="url(#clip0_1717_1086)">
      <!-- White glyph. -->
      <path id="Vector_Facebook"
            d="M15.1147 29.1371C15.1147 29.0822 15.1147 29.0296 15.1147 28.9747V18.9414H11.8183C11.6719 18.9414 11.6719 18.9414 11.6719 18.8018C11.6719 17.5642 11.6719 16.3289 11.6719 15.0937C11.6719 14.9793 11.7062 14.9518 11.816 14.9518C12.8683 14.9518 13.9206 14.9518 14.9751 14.9518H15.1215V14.8329C15.1215 13.8057 15.1215 12.774 15.1215 11.7492C15.1274 10.9262 15.3148 10.1146 15.6706 9.37241C16.1301 8.38271 16.9475 7.60378 17.9582 7.19235C18.6492 6.90525 19.3923 6.76428 20.1405 6.7783C21.0029 6.79202 21.8653 6.83091 22.7278 6.86065C22.8879 6.86065 23.048 6.89496 23.2082 6.90182C23.2974 6.90182 23.3271 6.94071 23.3271 7.02993C23.3271 7.54235 23.3271 8.05477 23.3271 8.5649C23.3271 9.16882 23.3271 9.77274 23.3271 10.3767C23.3271 10.4819 23.2974 10.5139 23.1921 10.5116C22.5379 10.5116 21.8814 10.5116 21.2271 10.5116C20.9287 10.5184 20.6316 10.5528 20.3395 10.6146C20.0822 10.6619 19.8463 10.7891 19.6653 10.9779C19.4842 11.1668 19.3672 11.4078 19.3307 11.6669C19.2857 11.893 19.2612 12.1226 19.2575 12.3531C19.2575 13.1904 19.2575 14.0299 19.2575 14.8695C19.2575 14.8946 19.2575 14.9198 19.2575 14.9564H23.0229C23.1807 14.9564 23.183 14.9564 23.1624 15.1074C23.0778 15.7662 22.9885 16.425 22.9039 17.0816C22.8322 17.6321 22.7636 18.1827 22.698 18.7332C22.6729 18.9437 22.6797 18.9437 22.4693 18.9437H19.2644V28.8992C19.2644 28.9793 19.2644 29.0593 19.2644 29.1394L15.1147 29.1371Z"
            fill="white" />
      <!-- White ring around the glyph (stroke only; no fill of its own). -->
      <path id="Vector_2_Facebook"
            d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z"
            stroke="white" stroke-width="1.0" stroke-miterlimit="10" />
    </g>
    <defs>
      <clipPath id="clip0_1717_1086">
        <rect width="35" height="35" fill="white" />
      </clipPath>
    </defs>
  </svg>
</a></li>
<!-- Icon-only link to the NLM YouTube channel. The accessible name and the
     SVG title use the brand's own spelling, "YouTube". -->
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="YouTube" target="_blank" rel="noopener noreferrer">
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
<title>YouTube</title>
<g id="YouTube" clip-path="url(#clip0_1717_1101)">
<path id="Vector_Youtube" d="M26.2571 11.4791C25.9025 11.1589 25.5709 10.9576 24.228 10.834C22.5512 10.6785 20.2797 10.6556 18.564 10.6533H16.4365C14.7208 10.6533 12.4493 10.6785 10.7725 10.834C9.43196 10.9576 9.09798 11.1589 8.7434 11.4791C7.81464 12.321 7.6202 14.6268 7.59961 16.8938C7.59961 17.3178 7.59961 17.741 7.59961 18.1635C7.62706 20.4121 7.82837 22.686 8.7434 23.521C9.09798 23.8412 9.42967 24.0425 10.7725 24.1661C12.4493 24.3216 14.7208 24.3445 16.4365 24.3468H18.564C20.2797 24.3468 22.5512 24.3216 24.228 24.1661C25.5686 24.0425 25.9025 23.8412 26.2571 23.521C27.1722 22.6929 27.3735 20.451 27.4009 18.2206C27.4009 17.7402 27.4009 17.2599 27.4009 16.7795C27.3735 14.5491 27.1699 12.3072 26.2571 11.4791ZM15.5604 20.5311V14.652L20.561 17.5001L15.5604 20.5311Z" fill="white"></path>
<path id="Vector_2_Youtube" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
</g>
<defs>
<clipPath id="clip0_1717_1101">
<rect width="35" height="35" fill="white"></rect>
</clipPath>
</defs>
</svg>
</a></li>
</ul>
</div>
<div class="col-lg-3 col-12">
  <!-- Postal address; the street lines link to the location on Google Maps
       and open in a new browsing context. -->
  <p class="address_footer text-white">National Library of Medicine<br />
    <a class="text-white"
       href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323"
       target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
    Bethesda, MD 20894</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
  <!-- Policy links, one per line. -->
  <p><a class="text-white" href="https://www.nlm.nih.gov/web_policies.html">Web Policies</a><br />
    <a class="text-white"
       href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office">FOIA</a><br />
    <a class="text-white" id="vdp"
       href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html">HHS Vulnerability Disclosure</a></p>
</div>
<div class="col-lg-3 col-12 centered-lg">
  <!-- Help, accessibility and careers links, one per line. -->
  <p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
    <a class="text-white" href="https://www.nlm.nih.gov/accessibility.html">Accessibility</a><br />
    <a class="text-white" href="https://www.nlm.nih.gov/careers/careers.html">Careers</a></p>
</div>
</div>
<div class="row">
<div class="col-lg-12 centered-lg">
<!-- Links to the parent organisations. Every link uses an explicit https://
     URL so the destination never depends on the scheme this page was
     loaded over. -->
<nav class="bottom-links">
  <ul class="mt-3">
    <li>
      <a class="text-white" href="https://www.nlm.nih.gov/">NLM</a>
    </li>
    <li>
      <a class="text-white" href="https://www.nih.gov/">NIH</a>
    </li>
    <li>
      <a class="text-white" href="https://www.hhs.gov/">HHS</a>
    </li>
    <li>
      <a class="text-white" href="https://www.usa.gov/">USA.gov</a>
    </li>
  </ul>
</nav>
</div>
</div>
</div>
</section>
<!-- Footer scripts, both served from /portal/portal3rc.fcgi. Judging only by
     the file names, the first looks like usage instrumentation and the second
     like shared header/footer behaviour; TODO confirm against the portal. -->
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
</div>
</div>
<!--/.footer-->
<!-- Page modification stamp; the <time> wrapper exposes the ISO 8601 value
     to machines while the visible text stays the same. -->
<p class="last-updated small">Last updated: <time datetime="2023-07-12T17:46:09Z">2023-07-12T17:46:09Z</time></p>
</div>
<!--/.page-->
</div>
<!--/.wrap-->
<span class="PAFAppResources"></span>
</div><!-- /.twelve_col -->
</div>
<!-- /.grid -->
<!-- usually for JS scripts at page bottom -->
<span class="pagefixtures"></span>
<!-- CE8B5AF87C7FFCB1_0191SID /projects/staticsites/SraDocs@1.5 portal105 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
<script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4217302/js/3879255/4121861/4082503/4217304/4087685.js" snapshot="sra"></script></body>
</html>