891 lines
54 KiB
XML
891 lines
54 KiB
XML
<?xml version="1.0" encoding="utf-8"?>
|
||
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
||
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
|
||
|
||
<head><meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
|
||
<!-- AppResources meta begin -->
|
||
<meta name="paf-app-resources" content="" />
|
||
<!-- AppResources meta end -->
|
||
|
||
<!-- TemplateResources meta begin -->
|
||
<meta name="paf_template" content="StdNCol" />
|
||
|
||
<!-- TemplateResources meta end -->
|
||
|
||
<!-- Page meta begin -->
|
||
|
||
<!-- Page meta end -->
|
||
|
||
<!-- Logger begin -->
|
||
<meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_app" content="dbgapdocs" /><meta xmlns:ncbi-portal="http://ncbi.gov/portal/XSLT/namespace" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" name="ncbi_pdid" content="static" />
|
||
<!-- Logger end -->
|
||
|
||
<title>dbGaP Molecular Data Submission Guide</title>
|
||
|
||
<!-- PageFixtures headcontent begin -->
|
||
|
||
|
||
<!-- PageFixtures headcontent end -->
|
||
|
||
<!-- AppResources external_resources begin -->
|
||
<script type="text/javascript" src="/core/jig/1.15.1/js/jig.min.js"></script>
|
||
|
||
<!-- AppResources external_resources end -->
|
||
|
||
<!-- Page headcontent begin -->
|
||
<meta name="subsite" content="dbgap" />
|
||
<meta name="path" content="dbgap/docs/moleculardatasection" />
|
||
<meta name="modified" content="2024-04-12T20:18:35Z" />
|
||
<!-- Page headcontent end -->
|
||
<!-- PageFixtures resources begin -->
|
||
<link xmlns="http://www.w3.org/1999/xhtml" type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4218191/css/4207974/4206132.css" xml:base="http://127.0.0.1/sites/static/header_footer" />
|
||
|
||
<!-- PageFixtures resources end -->
|
||
<link rel="shortcut icon" href="//www.ncbi.nlm.nih.gov/favicon.ico" /><meta name="ncbi_phid" content="CE8C416E7D1F84C10000000000BC00A9.m_5" />
|
||
<meta name='referrer' content='origin-when-cross-origin'/><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4176647/css/4121862/3974050/3917732/251717/4175140/14534/45193/3534283/4128070/4062871/4005757.css" /><link type="text/css" rel="stylesheet" href="//static.pubmed.gov/portal/portal3rc.fcgi/4176647/css/3529741/3529739.css" media="print" /></head>
|
||
<body class=" static">
|
||
<div class="grid">
|
||
<div class="col twelve_col nomargin shadow">
|
||
<!-- System messages like service outage or JS required; this is handled by the TemplateResources portlet -->
|
||
<div class="sysmessages">
|
||
<noscript>
|
||
<p class="nojs">
|
||
<strong>Warning:</strong>
|
||
The NCBI web site requires JavaScript to function.
|
||
<a href="/guide/browsers/#enablejs" title="Learn how to enable JavaScript" target="_blank">more...</a>
|
||
</p>
|
||
</noscript>
|
||
</div>
|
||
<!--/.sysmessage-->
|
||
<div class="wrap">
|
||
<div class="page">
|
||
<div xmlns:xi="http://www.w3.org/2001/XInclude">
|
||
<div xmlns="http://www.w3.org/1999/xhtml" id="universal_header" xml:base="http://127.0.0.1/sites/static/header_footer">
|
||
<section class="usa-banner">
|
||
<div class="usa-accordion">
|
||
<header class="usa-banner-header">
|
||
<div class="usa-grid usa-banner-inner">
|
||
<img src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/favicons/favicon-57.png" alt="U.S. flag" />
|
||
<p>An official website of the United States government</p>
|
||
<button class="non-usa-accordion-button usa-banner-button" aria-expanded="false" aria-controls="gov-banner-top" type="button">
|
||
<span class="usa-banner-button-text">Here's how you know</span>
|
||
</button>
|
||
</div>
|
||
</header>
|
||
<div class="usa-banner-content usa-grid usa-accordion-content" id="gov-banner-top" aria-hidden="true">
|
||
<div class="usa-banner-guidance-gov usa-width-one-half">
|
||
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-dot-gov.svg" alt="Dot gov" />
|
||
<div class="usa-media_block-body">
|
||
<p>
|
||
<strong>The .gov means it's official.</strong>
|
||
<br />
|
||
Federal government websites often end in .gov or .mil. Before
|
||
sharing sensitive information, make sure you're on a federal
|
||
government site.
|
||
</p>
|
||
</div>
|
||
</div>
|
||
<div class="usa-banner-guidance-ssl usa-width-one-half">
|
||
<img class="usa-banner-icon usa-media_block-img" src="https://www.ncbi.nlm.nih.gov/coreutils/uswds/img/icon-https.svg" alt="Https" />
|
||
<div class="usa-media_block-body">
|
||
<p>
|
||
<strong>The site is secure.</strong>
|
||
<br />
|
||
The <strong>https://</strong> ensures that you are connecting to the
|
||
official website and that any information you provide is encrypted
|
||
and transmitted securely.
|
||
</p>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
</section>
|
||
<div class="usa-overlay"></div>
|
||
<header class="ncbi-header" role="banner" data-section="Header">
|
||
|
||
<div class="usa-grid">
|
||
<div class="usa-width-one-whole">
|
||
|
||
<div class="ncbi-header__logo">
|
||
<a href="/" class="logo" aria-label="NCBI Logo" data-ga-action="click_image" data-ga-label="NIH NLM Logo">
|
||
<img src="https://www.ncbi.nlm.nih.gov/coreutils/nwds/img/logos/AgencyLogo.svg" alt="NIH NLM Logo" />
|
||
</a>
|
||
</div>
|
||
|
||
<div class="ncbi-header__account">
|
||
<a id="account_login" href="https://account.ncbi.nlm.nih.gov" class="usa-button header-button" style="display:none" data-ga-action="open_menu" data-ga-label="account_menu">Log in</a>
|
||
<button id="account_info" class="header-button" style="display:none" aria-controls="account_popup" type="button">
|
||
<span class="fa fa-user" aria-hidden="true">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" width="20px" height="20px">
|
||
<g style="fill: #fff">
|
||
<ellipse cx="12" cy="8" rx="5" ry="6"></ellipse>
|
||
<path d="M21.8,19.1c-0.9-1.8-2.6-3.3-4.8-4.2c-0.6-0.2-1.3-0.2-1.8,0.1c-1,0.6-2,0.9-3.2,0.9s-2.2-0.3-3.2-0.9 C8.3,14.8,7.6,14.7,7,15c-2.2,0.9-3.9,2.4-4.8,4.2C1.5,20.5,2.6,22,4.1,22h15.8C21.4,22,22.5,20.5,21.8,19.1z"></path>
|
||
</g>
|
||
</svg>
|
||
</span>
|
||
<span class="username desktop-only" aria-hidden="true" id="uname_short"></span>
|
||
<span class="sr-only">Show account info</span>
|
||
</button>
|
||
</div>
|
||
|
||
<div class="ncbi-popup-anchor">
|
||
<div class="ncbi-popup account-popup" id="account_popup" aria-hidden="true">
|
||
<div class="ncbi-popup-head">
|
||
<button class="ncbi-close-button" data-ga-action="close_menu" data-ga-label="account_menu" type="button">
|
||
<span class="fa fa-times">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 48 48" width="24px" height="24px">
|
||
<path d="M38 12.83l-2.83-2.83-11.17 11.17-11.17-11.17-2.83 2.83 11.17 11.17-11.17 11.17 2.83 2.83 11.17-11.17 11.17 11.17 2.83-2.83-11.17-11.17z"></path>
|
||
</svg>
|
||
</span>
|
||
<span class="usa-sr-only">Close</span></button>
|
||
<h4>Account</h4>
|
||
</div>
|
||
<div class="account-user-info">
|
||
Logged in as:<br />
|
||
<b><span class="username" id="uname_long">username</span></b>
|
||
</div>
|
||
<div class="account-links">
|
||
<ul class="usa-unstyled-list">
|
||
<li><a id="account_myncbi" href="/myncbi/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_myncbi">Dashboard</a></li>
|
||
<li><a id="account_pubs" href="/myncbi/collections/bibliography/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_pubs">Publications</a></li>
|
||
<li><a id="account_settings" href="/account/settings/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_settings">Account settings</a></li>
|
||
<li><a id="account_logout" href="/account/signout/" class="set-base-url" data-ga-action="click_menu_item" data-ga-label="account_logout">Log out</a></li>
|
||
</ul>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
|
||
</div>
|
||
</div>
|
||
</header>
|
||
<div role="navigation" aria-label="access keys">
|
||
<a id="nws_header_accesskey_0" href="https://www.ncbi.nlm.nih.gov/guide/browsers/#ncbi_accesskeys" class="usa-sr-only" accesskey="0" tabindex="-1">Access keys</a>
|
||
<a id="nws_header_accesskey_1" href="https://www.ncbi.nlm.nih.gov" class="usa-sr-only" accesskey="1" tabindex="-1">NCBI Homepage</a>
|
||
<a id="nws_header_accesskey_2" href="/myncbi/" class="set-base-url usa-sr-only" accesskey="2" tabindex="-1">MyNCBI Homepage</a>
|
||
<a id="nws_header_accesskey_3" href="#maincontent" class="usa-sr-only" accesskey="3" tabindex="-1">Main Content</a>
|
||
<a id="nws_header_accesskey_4" href="#" class="usa-sr-only" accesskey="4" tabindex="-1">Main Navigation</a>
|
||
</div>
|
||
<section data-section="Alerts">
|
||
<div class="ncbi-alerts-placeholder"></div>
|
||
</section>
|
||
</div>
|
||
</div>
|
||
<!--/.header-->
|
||
<div class="header">
|
||
<div class="res_logo"><h1 class="res_name"><a href="/gap/" title="dbGaP home">dbGaP</a></h1><h2 class="res_tagline">dbgap</h2></div>
|
||
<div class="search"><form method="get" action="/gap/"><div class="search_form"><label for="database" class="offscreen_noflow">Search database</label><select id="database"><optgroup label="Recent"><option value="gap" selected="selected">dbGaP</option><option value="clinvar">ClinVar</option><option value="medgen">MedGen</option><option value="pubmed" class="last">PubMed</option></optgroup><optgroup label="All"><option value="gquery">All Databases</option><option value="assembly">Assembly</option><option value="biocollections">Biocollections</option><option value="bioproject">BioProject</option><option value="biosample">BioSample</option><option value="books">Books</option><option value="clinvar">ClinVar</option><option value="cdd">Conserved Domains</option><option value="gap">dbGaP</option><option value="dbvar">dbVar</option><option value="gene">Gene</option><option value="genome">Genome</option><option value="gds">GEO DataSets</option><option value="geoprofiles">GEO Profiles</option><option value="gtr">GTR</option><option value="ipg">Identical Protein Groups</option><option value="medgen">MedGen</option><option value="mesh">MeSH</option><option value="nlmcatalog">NLM Catalog</option><option value="nuccore">Nucleotide</option><option value="omim">OMIM</option><option value="pmc">PMC</option><option value="protein">Protein</option><option value="proteinclusters">Protein Clusters</option><option value="protfam">Protein Family Models</option><option value="pcassay">PubChem BioAssay</option><option value="pccompound">PubChem Compound</option><option value="pcsubstance">PubChem Substance</option><option value="pubmed">PubMed</option><option value="snp">SNP</option><option value="sra">SRA</option><option value="structure">Structure</option><option value="taxonomy">Taxonomy</option><option value="toolkit">ToolKit</option><option value="toolkitall">ToolKitAll</option><option value="toolkitbookgh">ToolKitBookgh</option></optgroup></select><div class="nowrap"><label for="term" 
class="offscreen_noflow" accesskey="/">Search term</label><div class="nowrap"><input type="text" name="term" id="term" title="Search dbGaP" value="" class="jig-ncbiclearbutton jig-ncbiautocomplete" data-jigconfig="isEnabled:false,disableUrl:'NcbiSearchBarAutoComplCtrl'" autocomplete="off" data-sbconfig="ds:'no',pjs:'no',afs:'yes'" /></div><button id="search" type="submit" class="button_search nowrap" cmd="go">Search</button></div></div></form><ul class=" inline_list searchlinks"><li>
|
||
<a href="/gap/advanced/">Advanced</a>
|
||
</li><li>
|
||
<a href="/gap/limits/">Limits</a>
|
||
</li></ul></div>
|
||
|
||
</div>
|
||
<div class="nav_and_browser">
|
||
|
||
</div>
|
||
|
||
<!-- was itemctrl -->
|
||
<div class="container">
|
||
<div id="maincontent" class="content col twelve_col last">
|
||
<div class="col1">
|
||
<h1 id="dbgap-molecular-data-submission-">dbGaP Molecular Data Submission Guide</h1>
|
||
|
||
|
||
<p>Go back to <em><a href="/gap/docs/submissionguide">dbGaP Study Submission Guide</a></em></p>
|
||
|
||
|
||
<h2 data-heading="h2" data-no-toc="true">Summary of the Molecular Data Submission Process</h2>
|
||
|
||
|
||
<p>If you have a question, search through the commonly asked questions below. Otherwise, start with <a href="#genostart">Which data types can be submitted as "Molecular data" to the dbGaP Submission Portal?</a></p>
|
||
|
||
|
||
<div class="toc">
|
||
<ul>
|
||
<li><a href="#1-which-data-types-can-be-submit">1. Which data types can be submitted as "Molecular Data" to the dbGaP Submission Portal?</a></li>
|
||
<li><a href="#2-when-where-and-how-should-mole">2. When, where, and how should Molecular data be submitted?</a></li>
|
||
<li><a href="#3-what-are-the-sample-id-require">3. What are the Sample ID requirements for all individual level "Molecular Data"?</a></li>
|
||
<li><a href="#4-how-should-genotype-array-data">4. How should Genotype Array data be formatted?</a></li>
|
||
<li><a href="#5-how-should-snp-cnv-and-structu">5. How should SNP, CNV, and structural variants derived from sequence data be formatted?</a></li>
|
||
<li><a href="#6-how-should-imputations-be-form">6. How should Imputations be formatted?</a></li>
|
||
<li><a href="#7-how-should-expression-and-epig">7. How should Expression and Epigenetic data be formatted?</a></li>
|
||
<li><a href="#8-how-should-somatic-andor-germl">8. How should Somatic and/or Germline Mutation Annotations be formatted?</a></li>
|
||
<li><a href="#9-how-should-molecular-data-incl">9. How should Molecular data, including -omics data, in non-standard format be formatted?</a></li>
|
||
<li><a href="#10-what-are-common-errors-to-che">10. What are common errors to check for and what will happen after I submit Molecular data?</a></li>
|
||
</ul>
|
||
</div>
|
||
|
||
|
||
<p><a name="genostart" id="genostart"></a></p>
|
||
|
||
|
||
<h3 id="1-which-data-types-can-be-submit">1. Which data types can be submitted as "Molecular Data" to the dbGaP Submission Portal?</h3>
|
||
|
||
|
||
<p>Data generated with the use of molecular technologies (e.g., DNA/RNA/protein microarrays, DNA/RNA/protein sequencing, PCR) can be submitted, except for BAM, CRAM, and FASTQ data. BAM, CRAM, and FASTQ files should not be submitted as the "Molecular Data" type to the dbGaP Submission Portal. High throughput human sequence data and alignment information should be submitted through a separate process: <a href="/gap/docs/submissionguide#aSRA">High throughput sequencing submission instructions</a>. For specific requirements of each Molecular Data (non-SRA) type, click below:</p>
|
||
|
||
|
||
<ul>
|
||
<li><a href="#aarray">Genotype</a> (SNP array in PLINK format and if available, raw data (Illumina .idat or Affymetrix .cel), and genotype reports)</li>
|
||
<li><a href="#avcf">SNP, CNV, and structural variants derived from sequence data</a> (.vcf)</li>
|
||
<li><a href="#aimpute">Imputation</a> (IMPUTE2, MACH, MINIMAC, SHAPEIT)</li>
|
||
<li><a href="#expressionepigenetic">Expression/Epigenetic</a> array or counts (.txt, .tsv)</li>
|
||
<li><a href="#amaf">Somatic and/or germline mutation annotations</a> (.maf)</li>
|
||
<li><a href="#aother">Other</a> (individual and summary level data (.txt or .csv matrix), -omics, single cell, UCSC BED format, etc.)</li>
|
||
</ul>
|
||
|
||
|
||
<h3 id="2-when-where-and-how-should-mole">2. When, where, and how should Molecular data be submitted?</h3>
|
||
|
||
|
||
<p>Molecular data should be submitted to the dbGaP <a href="https://submit.ncbi.nlm.nih.gov/dbgap/">Submission Portal</a> under the section "Other files" with type "Molecular Data". It should be submitted along with the phenotype data or as early as possible so that it enters a dbGaP genotype curator's queue. </p>
|
||
|
||
|
||
<p>Please include a README with a brief description of the data that you are submitting. It should minimally include genotyping steps, genome build, and technology if applicable.</p>
|
||
|
||
|
||
<p>To compress and bundle files, zip first then tar. Do not tar first then zip as this will significantly delay the processing time.</p>
|
||
|
||
|
||
<p>For <strong>VCFs</strong>, the files should be compressed using bgzip instead of zip, as bgzip's block compression method can be used directly with VCFtools and BCFtools. This enables dbGaP to run QC checks quickly and report any errors back to you. For VCF files larger than 300GB, please split by chromosome, then tar the set of VCFs and submit as a single tarball.</p>
|
||
|
||
|
||
<p><a name="genosampID" id="genosampID"></a></p>
|
||
|
||
|
||
<h3 id="3-what-are-the-sample-id-require">3. What are the Sample ID requirements for all individual level "Molecular Data"?</h3>
|
||
|
||
|
||
<p><span style="color:red">Essential requirement: Sample IDs must be de-identified. Every sample ID found in an individual level Molecular Data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</span> See <a href="/gap/docs/submissionguide#sampid">SAMPLE_ID</a> in Glossary for full requirement details. Sample IDs that do not follow the requirements will not be processed. If sample IDs are modified, please also modify the corresponding <a href="/gap/docs/submissionguide#asampattr">Sample Attributes</a> dataset. </p>
|
||
|
||
|
||
<ul>
|
||
<li>The sample ID is ideally the final aliquot used for a sequencing run or well on an array plate. A person with a given subject ID can have many samples.</li>
|
||
<li>If a sample ID is a technical control such as Coriell HapMap sample or a publicly available control, it must be mapped to a subject ID in the <a href="/gap/docs/submissionguide#ssmds">Subject Sample Mapping (SSM) DS</a> and that subject ID must be explicitly marked as CONSENT=0 in the <a href="/gap/docs/submissionguide#scds">Subject Consent DS</a> dataset.</li>
|
||
<li>Single cells or multiplexed single cells should each be given a unique sample ID.</li>
|
||
<li>Sample IDs in sequence derived genotypes (VCFs) must be identical to the sample IDs used in the corresponding sequence data (BAMs).</li>
|
||
<li>Include a File Sample Mapping (FSM) file to map sample IDs to single sample data files.</li>
|
||
<li>Include README to describe content of data files and QC anomalies especially if the content is not in one of the formats listed and fits into the "Other" category.</li>
|
||
<li>Check that files are not truncated.</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="aarray" id="aarray"></a></p>
|
||
|
||
|
||
<h3 id="4-how-should-genotype-array-data">4. How should Genotype Array data be formatted?</h3>
|
||
|
||
|
||
<p>PLINK formatted genotype files are the preferred format for submitting genotype array data. They are submitted as binary (.bed/.bim/.fam) or text (.map/.ped or .tfam/.tped) sets. Please see <a href="http://zzz.bwh.harvard.edu/plink/">http://zzz.bwh.harvard.edu/plink/</a> and <a href="https://www.cog-genomics.org/plink/1.9">https://www.cog-genomics.org/plink/1.9</a> for PLINK specifications. The alleles should be encoded as ACGT for automated processing; otherwise, please be prepared for a longer processing time. Raw genotype data (Illumina .idat and Affymetrix .cel) should also be submitted if available. If Illumina's individual genotype reports or comparable reports are submitted without PLINK formatted sets, dbGaP will generate a PLINK formatted multisample set from the reports to include with the submitted files. Please do not submit VCFs for chip data.</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset. If each sample has multiple files, you may also create a File Sample Mapping (FSM) that has one column for the sample ID and the other column for the full filename including extensions.</li>
|
||
<li>
|
||
<p>Marker or Probe</p>
|
||
<ul>
|
||
<li>Provide the manufacturer's array manifest if available. This should include the .bpm or text-readable file, which contains the SNP or probe content on the array or assay. dbGaP will provide novel array manifests to dbSNP. Columns marked with * are required.<blockquote>
|
||
<table>
|
||
<thead>
|
||
<tr>
|
||
<th align="center">col_num</th>
|
||
<th>col_name</th>
|
||
</tr>
|
||
</thead>
|
||
<tbody>
|
||
<tr>
|
||
<td align="center">1</td>
|
||
<td>IlmnID [unique ID]*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">2</td>
|
||
<td>Name [Marker name]*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">3</td>
|
||
<td>IlmnStrand</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">4</td>
|
||
<td>SNP*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">5</td>
|
||
<td>AddressA_ID</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">6</td>
|
||
<td>AlleleA_ProbeSeq*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">7</td>
|
||
<td>AddressB_ID</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">8</td>
|
||
<td>AlleleB_ProbeSeq*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">9</td>
|
||
<td>GenomeBuild*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">10</td>
|
||
<td>Chr*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">11</td>
|
||
<td>MapInfo*</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">12</td>
|
||
<td>Ploidy</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">13</td>
|
||
<td>Species</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">14</td>
|
||
<td>Source</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">15</td>
|
||
<td>SourceVersion</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">16</td>
|
||
<td>SourceStrand</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">17</td>
|
||
<td>SourceSeq</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">18</td>
|
||
<td>TopGenomicSeq</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">19</td>
|
||
<td>BeadSetID</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">20</td>
|
||
<td>Exp_Clusters</td>
|
||
</tr>
|
||
<tr>
|
||
<td align="center">21</td>
|
||
<td>RefStrand*</td>
|
||
</tr>
|
||
</tbody>
|
||
</table>
|
||
</blockquote>
|
||
</li>
|
||
<li>If not available, submit an array annotation file with comprehensive marker/probe information (SNP, flanks, chr, position, genome build, reference strand, etc.)</li>
|
||
<li>The marker or probe information will be included in the release as a 'sample-info' component.</li>
|
||
</ul>
|
||
</li>
|
||
<li>
|
||
<p>PLINK</p>
|
||
<ul>
|
||
<li>.bed files</li>
|
||
<li>.fam/.ped/.tfam files<ul>
|
||
<li>Annotate with IIDs (sample IDs) using the same sample IDs listed in the <a href="/gap/docs/submissionguide#ssmds">SSM</a></li>
|
||
<li>If dataset contains duplicated samples, create a sample-level PLINK set. List the subject IDs as the Family IDs and the sample IDs as the IIDs.</li>
|
||
<li>Indicate which of the duplicates you recommend to use for GWAS or analyses. A list of duplicates can be submitted as a separate file.</li>
|
||
</ul>
|
||
</li>
|
||
<li>.bim/.map/.tped files<ul>
|
||
<li>Annotate variants with ACGT alleles</li>
|
||
<li>DO NOT manually modify marker level information in the BIM file</li>
|
||
<li>Sample and marker filter (.keep, .extract) files may be provided
|
||
<a name="rawgeno" id="rawgeno"></a></li>
|
||
</ul>
|
||
</li>
|
||
</ul>
|
||
</li>
|
||
<li>Raw Genotype Data (Illumina .idat or Affymetrix .cel)<ul>
|
||
<li>Provide single sample genotypes in the format of .idat or .cel files</li>
|
||
<li>.idat files should include both green and red intensity files</li>
|
||
<li>Provide a File Sample Mapping (FSM) file which explicitly maps each report name to the sample ID listed in the <a href="/gap/docs/submissionguide#ssmds">SSM</a></li>
|
||
</ul>
|
||
</li>
|
||
<li>Genotype Reports<ul>
|
||
<li>Individual genotype reports may be single sample or multisample reports</li>
|
||
<li>Provide Illumina's final reports or comparable reports. Required columns: SNP Name, Sample ID, alleles, intensities, genotype call quality scores, B allele frequencies, and other relevant information</li>
|
||
<li>Provide dictionary to describe columns</li>
|
||
<li>When PLINK formatted genotype files are not provided, single sample or multisample reports will be combined into a single PLINK formatted multisample set for release.</li>
|
||
</ul>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
<p>Example of a single sample header and report from Illumina</p>
|
||
|
||
|
||
<p>[Header] <br />
|
||
GSGT Version,1.9.4<br />
|
||
Processing Date,2/25/2014 4:59 AM<br />
|
||
Content,HumanOmni5Exome-4v1-1_A.bpm<br />
|
||
Num SNPs,4641218<br />
|
||
Total SNPs,4641218<br />
|
||
Num Samples,1200<br />
|
||
Total Samples,4181<br />
|
||
File,534 of 1200<br />
|
||
[Data]</p>
|
||
|
||
|
||
<p>Red is required and blue is recommended.</p>
|
||
|
||
|
||
<p><span style="color:red">SNP Name</span><br />
|
||
<span style="color:red">GC Score</span><br />
|
||
Allele1 - Forward<br />
|
||
Allele2 - Forward<br />
|
||
<span style="color:red">Allele1 - Top</span><br />
|
||
<span style="color:red">Allele2 - Top</span><br />
|
||
Allele1 - Design<br />
|
||
Allele2 - Design<br />
|
||
Allele1 - AB<br />
|
||
Allele2 - AB<br />
|
||
<span style="color:blue">Theta</span><br />
|
||
<span style="color:blue">R</span><br />
|
||
<span style="color:blue">X intensity</span><br />
|
||
<span style="color:blue">Y intensity</span><br />
|
||
X Raw<br />
|
||
Y Raw<br />
|
||
<span style="color:blue">B Allele Freq</span><br />
|
||
<span style="color:blue">Log R Ratio</span></p>
|
||
|
||
|
||
<ul>
|
||
<li>QC your data to identify sample switches, contaminated DNA, unexpected duplicates and relatedness, and samples with high MCR<ul>
|
||
<li>Exclude sample IDs and markers without genotype calls, where missing call rate (MCR) = 100%. Run PLINK command <code>--missing</code></li>
|
||
<li>Verify genotype sex and phenotype sex are identical. Run PLINK command <code>--check-sex</code>. Resolve by excluding problematic sample IDs or providing evidence in the form of a README for samples with known sex chromosome anomalies.</li>
|
||
<li>Verify IBD results from the PLINK set are consistent with known relationships provided in the <a href="/gap/docs/submissionguide#pdds">Pedigree DS</a>. Merge PLINK sets if there is more than one PLINK set before running IBD checks. Run PLINK commands <code>--freq</code> and <code>--genome</code>. Note that monozygotic twins should be marked in the Pedigree DS. Correct issues with unexpected duplicates or relatedness in the pedigree and genotype data, OR provide README documenting issue and reason why it cannot be resolved.</li>
|
||
</ul>
|
||
</li>
|
||
<li>Include description and data (IBD results, .genome file, thresholds, etc.) resulting from your data cleaning process. The QC data will be included in the release as a 'genotype-qc' component.</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="avcf" id="avcf"></a></p>
|
||
|
||
|
||
<h3 id="5-how-should-snp-cnv-and-structu">5. How should SNP, CNV, and structural variants derived from sequence data be formatted?</h3>
|
||
|
||
|
||
<p>The Variant Call Format (VCF) is the preferred format to submit SNP, CNV, and structural variants. VCFs can be derived from Whole Genome Sequences (WGS), Whole Exome Sequences (WXS), or targeted sequences (Targeted-Capture or OTHER). Please see <a href="https://samtools.github.io/hts-specs/">https://samtools.github.io/hts-specs/</a> for VCF specifications.</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</li>
|
||
<li>Marker or Probe<ul>
|
||
<li>Provide <strong>Marker Annotations</strong> as a separate file from the VCFs and include gene, gene_family, other identifiers and details</li>
|
||
</ul>
|
||
</li>
|
||
<li>VCF Header<ul>
|
||
<li>Information relevant for genotype calls should not be included in the <strong>Marker Annotations</strong>, but rather in the VCF header: ##INFO</li>
|
||
<li>Genome Build (e.g., GRCh38) should be included in the VCF header: ##reference</li>
|
||
<li>Exclude long internal paths to the individual data</li>
|
||
</ul>
|
||
</li>
|
||
<li>Multisample VCFs vs. single sample VCFs <ul>
|
||
<li>Multisample VCFs are preferred when variants are called across many samples.</li>
|
||
<li>Submit single sample VCFs only when the project calls variants for each sample independently against a reference genome and the variants are not compared across samples. </li>
|
||
<li>Merging single sample VCFs called individually against a reference into multisample VCFs is recommended ONLY if the KNOWN homozygous reference genotypes can be included for all samples/variants covered by sequencing. As per the VCF specification, the genotype string './.' should be used for any UNKNOWN genotypes.</li>
|
||
<li>Sequence derived genotypes should be identified with the same sample IDs as the sequence data (.bam, .cram, .fastq) they were derived from</li>
|
||
<li>Final VCFs can be processed by standard processing software (PSEQ, BCFTOOLS, VCFTOOLS, TABIX)<ul>
|
||
<li>If possible, submit tabix indexes along with the VCFs</li>
|
||
<li>Use bgzip to compress VCF files</li>
|
||
</ul>
|
||
</li>
|
||
<li>Set FILTER=PASS for markers with high quality data</li>
|
||
<li>Adhere to VCF specifications for missing data (including chrX genotypes for male samples)</li>
|
||
</ul>
|
||
</li>
|
||
<li>QC VCFs to identify sample switches, contaminated DNA, unexpected duplicates and relatedness, and samples with high MCR<ul>
|
||
<li>Exclude sample IDs and markers without genotype calls, where missing call rate (MCR) = 100%. Run PLINK command <code>--missing</code></li>
|
||
<li>Verify genotype sex and phenotype sex are identical. Run PLINK command <code>--check-sex</code>. Resolve by excluding problematic sample IDs or providing evidence in the form of a README for samples with known sex chromosome anomalies.</li>
|
||
<li>Verify IBD results from VCFs are consistent with known relationships provided in the <a href="/gap/docs/submissionguide#pdds">Pedigree DS</a>. Merge VCF sets if there are several multisample or single sample VCFs before running IBD checks. Note that monozygotic twins should be marked in the Pedigree DS. Correct issues with unexpected duplicates or relatedness in the pedigree and genotype data, OR provide README documenting issue and reason why it cannot be resolved.</li>
|
||
<li>dbGaP will create PLINK files from the VCFs to run QC checks, but will not release temporarily generated PLINK files.</li>
|
||
</ul>
|
||
</li>
|
||
<li>Include description and data (IBD results, thresholds, etc.) resulting from your data cleaning process. The QC data will be included in the release as a 'genotype-qc' component.</li>
|
||
</ul>
|
||
|
||
|
||
<p>For <strong>VCFs</strong>, the files should be compressed using bgzip instead of zip, as bgzip's block compression method can be used directly with VCFtools and BCFtools. This enables dbGaP to run QC checks quickly and report any errors back to you. For VCF files larger than 300GB, please split by chromosome, then tar the set of VCFs and submit as a single tarball.</p>
|
||
|
||
|
||
<p><a name="aimpute" id="aimpute"></a></p>
|
||
|
||
|
||
<h3 id="6-how-should-imputations-be-form">6. How should Imputations be formatted?</h3>
|
||
|
||
|
||
<p>Imputed genotype data can be submitted if they are generated from PLINK, BCFTOOLS, VCFTOOLS, IMPUTE2, and MACH/MINIMAC. Please discuss with a genotype curator if another format needs to be submitted.</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</li>
|
||
<li>Name and version of the reference panel used for imputations should be included in the Experiment Description or Report file</li>
|
||
<li>If not in the Experiment Description or Report file, include separately in a README<ul>
|
||
<li>Genotype set that was used as input</li>
|
||
<li>Software used</li>
|
||
<li>Thresholds or filters that were applied</li>
|
||
</ul>
|
||
</li>
|
||
<li>Large datasets, greater than 10GB, should be split by chromosomes for faster processing time</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="expressionepigenetic" id="expressionepigenetic"></a></p>
|
||
|
||
|
||
<h3 id="7-how-should-expression-and-epig">7. How should Expression and Epigenetic data be formatted?</h3>
|
||
|
||
|
||
<p>RNA microarray, RNA-seq derived expression, and methylation data may be submitted in the form of expression/methylation levels, exon/transcript/gene reads (number of reads overlapping a given feature such as an exon/transcript/gene), RPKMs (reads per kilobase of transcript per million mapped reads), or TPKMs (transcripts per kilobase million). If your data do not require controlled access, please submit to NCBI <a href="https://www.ncbi.nlm.nih.gov/geo/info/faq.html">GEO</a>, which is an unrestricted access database. To submit to dbGaP:</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</li>
|
||
<li>Data should be tab-delimited text-formatted multisample matrices that have markers listed as the first column in each row and samples as column headers.</li>
|
||
<li>There should be the same number of columns in each row.</li>
|
||
<li>Meta information and datasets should be submitted together to make submission MIAME compliant: <a href="https://www.ncbi.nlm.nih.gov/geo/info/MIAME.html">https://www.ncbi.nlm.nih.gov/geo/info/MIAME.html</a>. </li>
|
||
<li>Meta information as txt formatted files should include:<ul>
|
||
<li>General description of the experiments and datasets</li>
|
||
<li>Normalization procedures</li>
|
||
<li>Sample and marker filters</li>
|
||
</ul>
|
||
</li>
|
||
<li>For arrays submitted as Illumina .idat or Affymetrix .cel files, follow instructions under <a href="#rawgeno">"Raw Genotype Data"</a> above.</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="amaf" id="amaf"></a></p>
|
||
|
||
|
||
<h3 id="8-how-should-somatic-andor-germl">8. How should Somatic and/or Germline Mutation Annotations be formatted?</h3>
|
||
|
||
|
||
<p>Mutation Annotation Format (MAF) is a tab-delimited text file with aggregated mutation information from VCF files. It is used to describe genomic variations between tumor-normal tissues in cancer research. The column headers can be found <a href="https://docs.gdc.cancer.gov/Data/File_Formats/MAF_Format/#protected-maf-file-structure">here</a>.</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</li>
|
||
<li>If any column in a submitted MAF file is different from those in the description, provide a data dictionary for your MAF file.</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="aother" id="aother"></a></p>
|
||
|
||
|
||
<h3 id="9-how-should-molecular-data-incl">9. How should Molecular data, including -omics data, in non-standard format be formatted?</h3>
|
||
|
||
|
||
<p>The following applies to molecular data that cannot be submitted in any of the formats listed above, for example, individual and summary level data, -omics, single cell, UCSC BED format, or gVCFs:</p>
|
||
|
||
|
||
<ul>
|
||
<li>See <a href="#genosampID">sample ID requirements</a>. Every sample ID found in an individual level Molecular data file must be mapped to a consented subject in the Subject Sample Mapping (<a href="/gap/docs/submissionguide#ssmds">SSM</a>) dataset.</li>
|
||
<li>Provide platform, probe/marker set or genome build for the reference genome in a README or with the experiment description.</li>
|
||
<li>Include a File Sample Mapping (FSM) file to map sample IDs to single sample data files. For multisamples, mark the column containing sample IDs and let us know how to split the content on sample IDs if it is not obviously labeled. Generally for multisample matrices, data should be tab-delimited, text-formatted, and have markers listed as the first column in each row and samples as column headers.</li>
|
||
<li>There should be the same number of columns in each row.</li>
|
||
<li>Provide data dictionary for the column headers.</li>
|
||
<li>Include chr/pos/ref_allele/alt_allele and any number of relevant meta information.</li>
|
||
<li>Remove failed and excluded samples (do not mark/highlight) from data sheets.</li>
|
||
<li>Indicate which files are supplementary or summary-level results.</li>
|
||
<li>Large datasets, greater than 10GB, should be split by chromosomes for faster processing time</li>
|
||
<li>Include description and data (IBD results, .genome file, thresholds, etc.) resulting from your data cleaning process. The QC data will be included in the release as a 'genotype-qc' component.</li>
|
||
<li>Data that cannot be QC'ed will be split by consents and packed.</li>
|
||
</ul>
|
||
|
||
|
||
<p><a name="genoerrors" id="genoerrors"></a></p>
|
||
|
||
|
||
<h3 id="10-what-are-common-errors-to-che">10. What are common errors to check for and what will happen after I submit Molecular data?</h3>
|
||
|
||
|
||
<p>We expect submitters to have checked all of the consistency issues below prior to submitting. dbGaP genotype curators will verify and package the molecular data for release. Any exceptional case, such as loss of heterozygosity (LOH), Mendelian violations that cannot be resolved, or policy issues with distributing pedigree information, should be submitted with an additional README or other form of documentation. Please specify whether this documentation can be provided to dbGaP users or should stay internal to dbGaP.</p>
|
||
|
||
|
||
<p>Sample identity is verified</p>
|
||
|
||
|
||
<ul>
|
||
<li>Expected or Unexpected duplicates: samples found to have nearly identical genotypes are expected to belong to the same person unless the samples belong to a set of twins demarcated in the <a href="/gap/docs/submissionguide#pdds">Pedigree DS</a>. If a set of samples are expected duplicates, it means that the subject IDs (aka individual identifier (IID)) linked to the sample IDs in the <a href="/gap/docs/submissionguide#ssmds">SSM DS</a> will be identical. </li>
|
||
</ul>
|
||
|
||
|
||
<p>Sex of the samples is verified</p>
|
||
|
||
|
||
<ul>
|
||
<li>Sex is checked using PLINK software and/or dbGaP <a href="https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/Software.cgi">GRAF</a> using X chromosome heterozygosity rates and verified against the <a href="/gap/docs/submissionguide#spds">phenotype data</a> if sex is reported.</li>
|
||
</ul>
|
||
|
||
|
||
<p>Pedigree relations are verified</p>
|
||
|
||
|
||
<ul>
|
||
<li>Pedigree relations are checked using IBD and/or dbGaP <a href="https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/Software.cgi">GRAF</a> and verified against the phenotype data if a <a href="/gap/docs/submissionguide#pdds">Pedigree DS</a> is provided.</li>
|
||
</ul>
|
||
|
||
|
||
<p>SNP filtering</p>
|
||
|
||
|
||
<ul>
|
||
<li>Minor allele frequencies (MAF), missing call rates (MCR), and Mendelian errors are checked using PLINK and other software.</li>
|
||
</ul>
|
||
|
||
|
||
<p>Ancestry-specific allele frequencies are verified</p>
|
||
|
||
|
||
<ul>
|
||
<li>
|
||
<p>dbGaP subjects that have genomic data and have been designated "non-sensitive" for release of <a href="/gap/docs/submissionguide#agsr">Genomic Summary Results (GSR)</a> in the dbGaP <a href="/gap/docs/submissionguide#subsys">Submission System</a> will also be analyzed using <a href="https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/Software.cgi">GRAF-pop</a> and included in the <a href="/gap/docs/submissionguide#aalfa">ALFA</a> (<strong>Al</strong>lele <strong>F</strong>requency <strong>A</strong>ggregator) project. Studies may be contacted to correct the submitted data or provide a README if:</p>
|
||
<ol>
|
||
<li>They contain allele frequencies that deviate from the expected range of known allele frequencies for the <a href="https://www.ncbi.nlm.nih.gov/snp/docs/gsr/data_inclusion/#population">12 diverse populations</a>
|
||
and/or</li>
|
||
<li>The submitted ancestry or population deviates from the computed ancestry for a large number of samples.</li>
|
||
</ol>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
<p>Results of the checks may require the submitter to correct molecular data, phenotype data, or both. The most common error is that the IDs do not match between the molecular data and the phenotype data. Other common errors include missing samples and chromosomes, data to sample mapping errors, and data formatting errors.</p>
|
||
|
||
|
||
<p>Once all the QC checks pass, the individual level genotype data will be parsed by consents as demarcated in the <a href="/gap/docs/submissionguide#scds">Subject Consent DS</a> and packed in a tar. Publicly available controls such as Coriell HapMaps will be included in a separate .MULTI tar file if there are multiple consent groups or with the individual level data if there is a single consent group.</p>
|
||
|
||
|
||
<p>All annotation and QC data that were submitted or generated by dbGaP to process and analyze the data are packed within download tars:</p>
|
||
<ul>
|
||
<li>genotype-qc</li>
|
||
<li>sample-info</li>
|
||
<li>marker-info</li>
|
||
</ul>
|
||
</div>
|
||
<!--/.col1-->
|
||
<div class="col2">
|
||
|
||
</div>
|
||
<!--/.col2-->
|
||
<div class="col3">
|
||
|
||
</div>
|
||
<!--/.col3-->
|
||
<div class="col4">
|
||
|
||
</div>
|
||
<!--/.col4-->
|
||
<div class="col5">
|
||
|
||
</div>
|
||
<div class="col6">
|
||
|
||
</div>
|
||
<div class="col7">
|
||
|
||
</div>
|
||
<div class="col8">
|
||
|
||
</div>
|
||
<div class="col9">
|
||
|
||
</div>
|
||
</div><!--/.content-->
|
||
</div><!--/.container-->
|
||
<div id="NCBIFooter_dynamic">
|
||
<div class="breadcrumbs">You are here:
|
||
<span id="breadcrumb_text"><a href="/guide/">NCBI</a></span></div>
|
||
<a id="help-desk-link" class="help_desk" href="https://support.ncbi.nlm.nih.gov/ics/support/default.asp?Time=2025-03-12T17:57:12-04:00&amp;Snapshot=%2Fprojects%2FdbGap%2Fgapdocs@1.2&amp;Host=portal105&amp;ncbi_phid=CE8C416E7D1F84C10000000000BC00A9&amp;ncbi_session=CE8B5AF87C7FFCB1_0191SID&amp;from=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fgap%2Fdocs%2Fmoleculardatasection%2F&amp;Ncbi_App=dbgapdocs&amp;Page=static&amp;style=classic&amp;deptID=28049" target="_blank">Support Center</a>
|
||
<noscript><img alt="" src="/stat?jsdisabled=true&amp;ncbi_app=dbgapdocs&amp;ncbi_db=&amp;ncbi_pdid=static&amp;ncbi_phid=CE8C416E7D1F84C10000000000BC00A9" /></noscript>
|
||
</div>
|
||
|
||
|
||
<div xmlns:xi="http://www.w3.org/2001/XInclude">
|
||
<div xmlns="http://www.w3.org/1999/xhtml" class="footer" id="footer" xml:base="http://127.0.0.1/sites/static/header_footer">
|
||
<section class="icon-section">
|
||
<div id="icon-section-header" class="icon-section_header">Follow NCBI</div>
|
||
<div class="grid-container container">
|
||
<div class="icon-section_container">
|
||
<a class="footer-icon" id="footer_twitter" href="https://twitter.com/ncbi" aria-label="Twitter">
|
||
<svg xmlns="http://www.w3.org/2000/svg" width="40" height="40" viewBox="0 0 40 40" fill="none">
|
||
<title>Twitter</title>
|
||
<g id="twitterx1008">
|
||
<path id="path1008" d="M6.06736 7L16.8778 20.8991L6.00001 32.2H10.2L18.6 23.1L25.668 32.2H34L22.8 17.5L31.9 7H28.4L20.7 15.4L14.401 7H6.06898H6.06736ZM9.66753 8.73423H12.9327L29.7327 30.4658H26.5697L9.66753 8.73423Z" fill="#5B616B"></path>
|
||
</g>
|
||
</svg>
|
||
</a>
|
||
<a class="footer-icon" id="footer_facebook" href="https://www.facebook.com/ncbi.nlm" aria-label="Facebook"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
|
||
<title>Facebook</title>
|
||
<path class="cls-11" d="M210.5,115.12H171.74V97.82c0-8.14,5.39-10,9.19-10h27.14V52l-39.32-.12c-35.66,0-42.42,26.68-42.42,43.77v19.48H99.09v36.32h27.24v109h45.41v-109h35Z">
|
||
</path>
|
||
</svg></a>
|
||
<a class="footer-icon" id="footer_linkedin" href="https://www.linkedin.com/company/ncbinlm" aria-label="LinkedIn"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
|
||
<title>LinkedIn</title>
|
||
<path class="cls-11" d="M101.64,243.37H57.79v-114h43.85Zm-22-131.54h-.26c-13.25,0-21.82-10.36-21.82-21.76,0-11.65,8.84-21.15,22.33-21.15S101.7,78.72,102,90.38C102,101.77,93.4,111.83,79.63,111.83Zm100.93,52.61A17.54,17.54,0,0,0,163,182v61.39H119.18s.51-105.23,0-114H163v13a54.33,54.33,0,0,1,34.54-12.66c26,0,44.39,18.8,44.39,55.29v58.35H198.1V182A17.54,17.54,0,0,0,180.56,164.44Z">
|
||
</path>
|
||
</svg></a>
|
||
<a class="footer-icon" id="footer_github" href="https://github.com/ncbi" aria-label="GitHub"><svg xmlns="http://www.w3.org/2000/svg" data-name="Layer 1" viewBox="0 0 300 300">
|
||
<defs>
|
||
<style>
|
||
.cls-11,
|
||
.cls-12 {
|
||
fill: #737373;
|
||
}
|
||
|
||
.cls-11 {
|
||
fill-rule: evenodd;
|
||
}
|
||
</style>
|
||
</defs>
|
||
<title>GitHub</title>
|
||
<path class="cls-11" d="M151.36,47.28a105.76,105.76,0,0,0-33.43,206.1c5.28,1,7.22-2.3,7.22-5.09,0-2.52-.09-10.85-.14-19.69-29.42,6.4-35.63-12.48-35.63-12.48-4.81-12.22-11.74-15.47-11.74-15.47-9.59-6.56.73-6.43.73-6.43,10.61.75,16.21,10.9,16.21,10.9,9.43,16.17,24.73,11.49,30.77,8.79,1-6.83,3.69-11.5,6.71-14.14C108.57,197.1,83.88,188,83.88,147.51a40.92,40.92,0,0,1,10.9-28.39c-1.1-2.66-4.72-13.42,1-28,0,0,8.88-2.84,29.09,10.84a100.26,100.26,0,0,1,53,0C198,88.3,206.9,91.14,206.9,91.14c5.76,14.56,2.14,25.32,1,28a40.87,40.87,0,0,1,10.89,28.39c0,40.62-24.74,49.56-48.29,52.18,3.79,3.28,7.17,9.71,7.17,19.58,0,14.15-.12,25.54-.12,29,0,2.82,1.9,6.11,7.26,5.07A105.76,105.76,0,0,0,151.36,47.28Z">
|
||
</path>
|
||
<path class="cls-12" d="M85.66,199.12c-.23.52-1.06.68-1.81.32s-1.2-1.06-.95-1.59,1.06-.69,1.82-.33,1.21,1.07.94,1.6Zm-1.3-1">
|
||
</path>
|
||
<path class="cls-12" d="M90,203.89c-.51.47-1.49.25-2.16-.49a1.61,1.61,0,0,1-.31-2.19c.52-.47,1.47-.25,2.17.49s.82,1.72.3,2.19Zm-1-1.08">
|
||
</path>
|
||
<path class="cls-12" d="M94.12,210c-.65.46-1.71,0-2.37-.91s-.64-2.07,0-2.52,1.7,0,2.36.89.65,2.08,0,2.54Zm0,0"></path>
|
||
<path class="cls-12" d="M99.83,215.87c-.58.64-1.82.47-2.72-.41s-1.18-2.06-.6-2.7,1.83-.46,2.74.41,1.2,2.07.58,2.7Zm0,0">
|
||
</path>
|
||
<path class="cls-12" d="M107.71,219.29c-.26.82-1.45,1.2-2.64.85s-2-1.34-1.74-2.17,1.44-1.23,2.65-.85,2,1.32,1.73,2.17Zm0,0">
|
||
</path>
|
||
<path class="cls-12" d="M116.36,219.92c0,.87-1,1.59-2.24,1.61s-2.29-.68-2.3-1.54,1-1.59,2.26-1.61,2.28.67,2.28,1.54Zm0,0">
|
||
</path>
|
||
<path class="cls-12" d="M124.42,218.55c.15.85-.73,1.72-2,1.95s-2.37-.3-2.52-1.14.73-1.75,2-2,2.37.29,2.53,1.16Zm0,0"></path>
|
||
</svg></a>
|
||
<a class="footer-icon" id="footer_blog" href="https://ncbiinsights.ncbi.nlm.nih.gov/" aria-label="Blog">
|
||
<svg xmlns="http://www.w3.org/2000/svg" id="Layer_1" data-name="Layer 1" viewBox="0 0 40 40">
|
||
<defs><style>.cls-1{fill:#737373;}</style></defs>
|
||
<title>NCBI Insights Blog</title>
|
||
<path class="cls-1" d="M14,30a4,4,0,1,1-4-4,4,4,0,0,1,4,4Zm11,3A19,19,0,0,0,7.05,15a1,1,0,0,0-1,1v3a1,1,0,0,0,.93,1A14,14,0,0,1,20,33.07,1,1,0,0,0,21,34h3a1,1,0,0,0,1-1Zm9,0A28,28,0,0,0,7,6,1,1,0,0,0,6,7v3a1,1,0,0,0,1,1A23,23,0,0,1,29,33a1,1,0,0,0,1,1h3A1,1,0,0,0,34,33Z"></path>
|
||
</svg>
|
||
</a>
|
||
</div>
|
||
</div>
|
||
</section>
|
||
|
||
<section class="container-fluid bg-primary">
|
||
<div class="container pt-5">
|
||
<div class="row mt-3">
|
||
<div class="col-lg-3 col-12">
|
||
<p><a class="text-white" href="https://www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a></p>
|
||
<ul class="list-inline social_media">
|
||
<li class="list-inline-item"><a href="https://twitter.com/NLM_NIH" aria-label="Twitter" target="_blank" rel="noopener noreferrer">
|
||
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
|
||
<title>Twitter</title>
|
||
<g id="twitterx1009" clip-path="url(#clip0_65276_3946)">
|
||
<path id="Vector_Twitter" d="M17.5006 34.6565C26.9761 34.6565 34.6575 26.9751 34.6575 17.4996C34.6575 8.02416 26.9761 0.342773 17.5006 0.342773C8.02514 0.342773 0.34375 8.02416 0.34375 17.4996C0.34375 26.9751 8.02514 34.6565 17.5006 34.6565Z" fill="#205493" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
|
||
<path id="path1009" d="M8.54811 8.5L16.2698 18.4279L8.50001 26.5H11.5L17.5 20L22.5486 26.5H28.5L20.5 16L27 8.5H24.5L19 14.5L14.5007 8.5H8.54927H8.54811ZM11.1197 9.73873H13.4519L25.4519 25.2613H23.1926L11.1197 9.73873Z" fill="white"></path>
|
||
</g>
|
||
<defs>
|
||
<clipPath id="clip0_65276_3946">
|
||
<rect width="35" height="35" fill="white"></rect>
|
||
</clipPath>
|
||
</defs>
|
||
</svg>
|
||
</a></li>
|
||
<li class="list-inline-item"><a href="https://www.facebook.com/nationallibraryofmedicine" aria-label="Facebook" rel="noopener noreferrer" target="_blank">
|
||
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
|
||
<title>Facebook</title>
|
||
<g id="Facebook" clip-path="url(#clip0_1717_1086)">
|
||
<path id="Vector_Facebook" d="M15.1147 29.1371C15.1147 29.0822 15.1147 29.0296 15.1147 28.9747V18.9414H11.8183C11.6719 18.9414 11.6719 18.9414 11.6719 18.8018C11.6719 17.5642 11.6719 16.3289 11.6719 15.0937C11.6719 14.9793 11.7062 14.9518 11.816 14.9518C12.8683 14.9518 13.9206 14.9518 14.9751 14.9518H15.1215V14.8329C15.1215 13.8057 15.1215 12.774 15.1215 11.7492C15.1274 10.9262 15.3148 10.1146 15.6706 9.37241C16.1301 8.38271 16.9475 7.60378 17.9582 7.19235C18.6492 6.90525 19.3923 6.76428 20.1405 6.7783C21.0029 6.79202 21.8653 6.83091 22.7278 6.86065C22.8879 6.86065 23.048 6.89496 23.2082 6.90182C23.2974 6.90182 23.3271 6.94071 23.3271 7.02993C23.3271 7.54235 23.3271 8.05477 23.3271 8.5649C23.3271 9.16882 23.3271 9.77274 23.3271 10.3767C23.3271 10.4819 23.2974 10.5139 23.1921 10.5116C22.5379 10.5116 21.8814 10.5116 21.2271 10.5116C20.9287 10.5184 20.6316 10.5528 20.3395 10.6146C20.0822 10.6619 19.8463 10.7891 19.6653 10.9779C19.4842 11.1668 19.3672 11.4078 19.3307 11.6669C19.2857 11.893 19.2612 12.1226 19.2575 12.3531C19.2575 13.1904 19.2575 14.0299 19.2575 14.8695C19.2575 14.8946 19.2575 14.9198 19.2575 14.9564H23.0229C23.1807 14.9564 23.183 14.9564 23.1624 15.1074C23.0778 15.7662 22.9885 16.425 22.9039 17.0816C22.8322 17.6321 22.7636 18.1827 22.698 18.7332C22.6729 18.9437 22.6797 18.9437 22.4693 18.9437H19.2644V28.8992C19.2644 28.9793 19.2644 29.0593 19.2644 29.1394L15.1147 29.1371Z" fill="white"></path>
|
||
<path id="Vector_2_Facebook" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
|
||
</g>
|
||
<defs>
|
||
<clipPath id="clip0_1717_1086">
|
||
<rect width="35" height="35" fill="white"></rect>
|
||
</clipPath>
|
||
</defs>
|
||
</svg>
|
||
</a></li>
|
||
<li class="list-inline-item"><a href="https://www.youtube.com/user/NLMNIH" aria-label="YouTube" target="_blank" rel="noopener noreferrer">
|
||
<svg xmlns="http://www.w3.org/2000/svg" width="35" height="35" viewBox="0 0 36 35" fill="none">
|
||
<title>YouTube</title>
|
||
<g id="YouTube" clip-path="url(#clip0_1717_1101)">
|
||
<path id="Vector_Youtube" d="M26.2571 11.4791C25.9025 11.1589 25.5709 10.9576 24.228 10.834C22.5512 10.6785 20.2797 10.6556 18.564 10.6533H16.4365C14.7208 10.6533 12.4493 10.6785 10.7725 10.834C9.43196 10.9576 9.09798 11.1589 8.7434 11.4791C7.81464 12.321 7.6202 14.6268 7.59961 16.8938C7.59961 17.3178 7.59961 17.741 7.59961 18.1635C7.62706 20.4121 7.82837 22.686 8.7434 23.521C9.09798 23.8412 9.42967 24.0425 10.7725 24.1661C12.4493 24.3216 14.7208 24.3445 16.4365 24.3468H18.564C20.2797 24.3468 22.5512 24.3216 24.228 24.1661C25.5686 24.0425 25.9025 23.8412 26.2571 23.521C27.1722 22.6929 27.3735 20.451 27.4009 18.2206C27.4009 17.7402 27.4009 17.2599 27.4009 16.7795C27.3735 14.5491 27.1699 12.3072 26.2571 11.4791ZM15.5604 20.5311V14.652L20.561 17.5001L15.5604 20.5311Z" fill="white"></path>
|
||
<path id="Vector_2_Youtube" d="M17.5006 34.657C26.9761 34.657 34.6575 26.9756 34.6575 17.5001C34.6575 8.02465 26.9761 0.343262 17.5006 0.343262C8.02514 0.343262 0.34375 8.02465 0.34375 17.5001C0.34375 26.9756 8.02514 34.657 17.5006 34.657Z" stroke="white" stroke-width="1.0" stroke-miterlimit="10"></path>
|
||
</g>
|
||
<defs>
|
||
<clipPath id="clip0_1717_1101">
|
||
<rect width="35" height="35" fill="white"></rect>
|
||
</clipPath>
|
||
</defs>
|
||
</svg>
|
||
</a></li>
|
||
</ul>
|
||
</div>
|
||
<div class="col-lg-3 col-12">
|
||
<p class="address_footer text-white">National Library of Medicine<br />
|
||
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white" target="_blank" rel="noopener noreferrer">8600 Rockville Pike<br />
|
||
Bethesda, MD 20894</a></p>
|
||
</div>
|
||
<div class="col-lg-3 col-12 centered-lg">
|
||
<p><a href="https://www.nlm.nih.gov/web_policies.html" class="text-white">Web Policies</a><br />
|
||
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white">FOIA</a><br />
|
||
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white" id="vdp">HHS Vulnerability Disclosure</a></p>
|
||
</div>
|
||
<div class="col-lg-3 col-12 centered-lg">
|
||
<p><a class="supportLink text-white" href="https://support.nlm.nih.gov/">Help</a><br />
|
||
<a href="https://www.nlm.nih.gov/accessibility.html" class="text-white">Accessibility</a><br />
|
||
<a href="https://www.nlm.nih.gov/careers/careers.html" class="text-white">Careers</a></p>
|
||
</div>
|
||
</div>
|
||
<div class="row">
|
||
<div class="col-lg-12 centered-lg">
|
||
<nav class="bottom-links">
|
||
<ul class="mt-3">
|
||
<li>
|
||
<a class="text-white" href="https://www.nlm.nih.gov/">NLM</a>
|
||
</li>
|
||
<li>
|
||
<a class="text-white" href="https://www.nih.gov/">NIH</a>
|
||
</li>
|
||
<li>
|
||
<a class="text-white" href="https://www.hhs.gov/">HHS</a>
|
||
</li>
|
||
<li>
|
||
<a class="text-white" href="https://www.usa.gov/">USA.gov</a>
|
||
</li>
|
||
</ul>
|
||
</nav>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
</section>
|
||
<script type="text/javascript" src="/portal/portal3rc.fcgi/rlib/js/InstrumentOmnitureBaseJS/InstrumentNCBIConfigJS/InstrumentNCBIBaseJS/InstrumentPageStarterJS.js?v=1"> </script>
|
||
<script type="text/javascript" src="/portal/portal3rc.fcgi/static/js/hfjs2.js"> </script>
|
||
</div>
|
||
</div>
|
||
<!--/.footer-->
|
||
<p class="last-updated small">Last updated: 2024-04-12T20:18:35Z</p>
|
||
</div>
|
||
<!--/.page-->
|
||
</div>
|
||
<!--/.wrap-->
|
||
<span class="PAFAppResources"></span>
|
||
|
||
|
||
</div><!-- /.twelve_col -->
|
||
</div>
|
||
<!-- /.grid -->
|
||
|
||
|
||
|
||
<!-- usually for JS scripts at page bottom -->
|
||
<span class="pagefixtures"></span>
|
||
|
||
|
||
<!-- CE8B5AF87C7FFCB1_0191SID /projects/dbGap/gapdocs@1.2 portal105 v4.1.r689238 Tue, Oct 22 2024 16:10:51 -->
|
||
<span id="portal-csrf-token" style="display:none" data-token="CE8B5AF87C7FFCB1_0191SID"></span>
|
||
|
||
<script type="text/javascript" src="//static.pubmed.gov/portal/portal3rc.fcgi/4176647/js/3879255/4121861/4175147/4087685.js" snapshot="gap"></script></body>
|
||
</html>
|
||
|