nih-gov/www.nlm.nih.gov/webcollecting/index.html
2025-02-26 13:17:41 -05:00

303 lines
21 KiB
HTML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<!doctype html>
<html lang="en">
<head>
<!-- Character encoding is declared first so it is seen before any other metadata. -->
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<!-- One X-UA-Compatible declaration only; repeating it with a different value is ambiguous. -->
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<link rel="preconnect" href="https://fonts.googleapis.com">
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
<link href="https://fonts.googleapis.com/css2?family=Roboto:wght@100;300;400;500;700&display=swap" rel="stylesheet">
<link rel="stylesheet" href="https://use.fontawesome.com/releases/v5.0.10/css/all.css" integrity="sha384-+d0P83n9kaQMCwj8F4RJB66tzIwOKmrdb46+porD/OvrJ+37WqIM7UoBtwHO6Nlg" crossorigin="anonymous">
<link rel="stylesheet" href="/home_assets/uswds/css/styles.css">
<title>NLM Web Collecting and Archiving</title>
<link rel="schema.DC" href="http://purl.org/dc/elements/1.1/" title="The Dublin Core metadata Element Set" />
<meta name="DC.Title" content="NLM Web Collecting and Archiving" />
<meta name="DC.Publisher" content="U.S. National Library of Medicine" />
<meta name="DC.Date.Issued" content="2012-11-06" />
<meta name="DC.Date.Modified" content="2024-10-17" />
<meta name="NLMDC.Date.LastReviewed" content="2024-10-17" />
<meta name="NLM.Contact.Email" content="moffattc@mail.nlm.nih.gov" />
<meta name="DC.Type" content="Product, Program, and Project Descriptions" />
<meta name="NLM.Permanence.Level" content="Permanence Not Guaranteed" />
<meta name="DC.Rights" content="Public Domain" />
<meta name="DC.Language" content="eng" />
<link rel="stylesheet" href="/styles/responsive_images.css" media="all" />
<!-- Google Tag Manager --><script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push(
{'gtm.start': new Date().getTime(),event:'gtm.js'}
);var f=d.getElementsByTagName(s)[0],j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-MT6MLL');</script>
<!-- End Google Tag Manager -->
</head>
<body>
<!-- Google Tag Manager -->
<noscript><iframe src="//www.googletagmanager.com/ns.html?id=GTM-MT6MLL" height="0" width="0" style="display:none;visibility:hidden" title="googletagmanager"></iframe></noscript>
<!-- End Google Tag Manager -->
<!-- TOP NAV -->
<a class="usa-skipnav" href="#main">Skip to main content</a>
<section class="usa-banner" aria-label="Official website of the United States government">
<div class="usa-accordion">
<header class="usa-banner__header">
<div class="usa-banner__inner">
<div class="grid-col-auto"> <img class="usa-banner__header-flag" src="https://assets.nlm.nih.gov/uswds/img/us_flag_small.png" alt="U.S. flag"/> </div>
<div class="grid-col-fill tablet:grid-col-auto">
<p class="usa-banner__header-text"> An official website of the United States government </p>
<p class="usa-banner__header-action" aria-hidden="true"> Here&rsquo;s how you know </p>
</div>
<button class="usa-accordion__button usa-banner__button" aria-expanded="false" aria-controls="gov-banner"> <span class="usa-banner__button-text">Here&rsquo;s how you know</span> </button>
</div>
</header>
<div class="usa-banner__content usa-accordion__content" id="gov-banner">
<div class="grid-row grid-gap-lg">
<div class="usa-banner__guidance tablet:grid-col-6"> <img class="usa-banner__icon usa-media-block__img" src="https://assets.nlm.nih.gov/uswds/img/icon-dot-gov.svg" role="img" alt="" aria-hidden="true"/>
<div class="usa-media-block__body">
<p> <strong> Official websites use .gov </strong> <br />
A <strong>.gov</strong> website belongs to an official government
organization in the United States. </p>
</div>
</div>
<div class="usa-banner__guidance tablet:grid-col-6"> <img class="usa-banner__icon usa-media-block__img" src="https://assets.nlm.nih.gov/uswds/img/icon-https.svg" role="img" alt="" aria-hidden="true"/>
<div class="usa-media-block__body">
<p> <strong> Secure .gov websites use HTTPS </strong> <br />
A <strong>lock</strong> ( <span class="icon-lock">
<svg xmlns="http://www.w3.org/2000/svg" width="52" height="64" viewBox="0 0 52 64" class="usa-banner__lock-image" role="img" aria-labelledby="banner-lock-title-default banner-lock-description-default" focusable="false">
<title id="banner-lock-title-default">Lock</title>
<desc id="banner-lock-description-default">A locked padlock</desc>
<path fill="#000000" fill-rule="evenodd" d="M26 0c10.493 0 19 8.507 19 19v9h3a4 4 0 0 1 4 4v28a4 4 0 0 1-4 4H4a4 4 0 0 1-4-4V32a4 4 0 0 1 4-4h3v-9C7 8.507 15.507 0 26 0zm0 8c-5.979 0-10.843 4.77-10.996 10.712L15 19v9h22v-9c0-6.075-4.925-11-11-11z"/>
</svg>
</span> ) or <strong>https://</strong> means you&rsquo;ve safely connected to the .gov website. Share sensitive information only on official, secure websites. </p>
</div>
</div>
</div>
</div>
</div>
</section>
<!-- HEADER -->
<header id="siteheader" class="usa-header usa-header--basic">
<div class="usa-nav-container tablet:padding-x-4 mobile-lg:padding-x-2 padding-y-1">
<div class="grid-row padding-y-105">
<div class="grid-col-8 desktop:grid-col-4 tablet-lg:grid-col-4 tablet:grid-col-6"> <a href="https://www.nlm.nih.gov/"> <img src="https://assets.nlm.nih.gov/uswds/img/NLM_White.png" alt="NLM logo" class="logo margin-top-1"> </a> </div>
<div class="desktop:grid-col-4 desktop:grid-offset-4 tablet-lg:grid-col-6 tablet-lg:grid-offset-2 tablet:grid-col-6 grid-col-12">
<!-- Site search form. The submit button is a native <button>, so it needs no explicit role;
     its accessible name comes from aria-label and the icon is decorative. -->
<form class="usa-search desktop:margin-top-2 tablet:margin-top-2 mobile:margin-top-1" role="search" data-gtm-form-interact-id="0" method="get" action="//vsearch.nlm.nih.gov/vivisimo/cgi-bin/query-meta" target="_self" name="searchForm" id="searchForm2">
<input class="usa-input ui-autocomplete-input" aria-label="Search" type="search" name="query" data-gtm-form-interact-field-id="0" id="search2" autocomplete="off" placeholder="Search NLM">
<input type="hidden" name="v:project" value="nlm-main-website">
<button class="usa-button border border-top border-bottom border-right border-white" aria-label="Search" type="submit"> <span class="usa-search__submit-text"> <i class="fas fa-search" aria-hidden="true"></i> </span> </button>
</form>
</div>
</div>
</div>
</header>
<div class="bg-secondary insertCOOP">
<div class="usa-nav-container">
<div class="usa-navbar ">
<button class="usa-menu-btn">Menu</button>
</div>
<nav aria-label="Primary navigation" class="usa-nav">
<button class="usa-nav__close"><img src="https://assets.nlm.nih.gov/uswds/img/close.svg" alt="close"></button>
<ul class="usa-nav__primary usa-accordion insertNav">
<li class="usa-nav__primary-item desktop-lg:margin-x-5 desktop:margin-x-3 tablet:margin-x-0">
<button type="button" class="usa-accordion__button usa-nav__link usa-current" aria-expanded="false" aria-controls="basic-nav-section-one"> <span>Products and Services <i class="fas fa-caret-down margin-left-05"></i> </span> </button>
<ul id="basic-nav-section-one" class="usa-nav__submenu bg-secondary" hidden="">
<li class="usa-nav__submenu-item"> <a href="//eresources.nlm.nih.gov/nlm_eresources/"><span>All Products and Services</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//clinicaltrials.gov/"><span>ClinicalTrials.gov</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//collections.nlm.nih.gov/"><span>Digital Collections</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//catalog.nlm.nih.gov"><span>LocatorPlus Catalog</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//meshb.nlm.nih.gov/search"><span>Medical Subject Headings (MeSH)</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//medlineplus.gov/"><span>MedlinePlus</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//pubmed.ncbi.nlm.nih.gov/"><span>PubMed/MEDLINE</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//uts.nlm.nih.gov/uts/"><span>Unified Medical Language System (UMLS)</span></a> </li>
</ul>
</li>
<!-- "Resources for You" menu item; href values and link labels carry no stray whitespace. -->
<li class="usa-nav__primary-item desktop-lg:margin-x-5 desktop:margin-x-3 tablet:margin-x-0">
<button type="button" class="usa-accordion__button usa-nav__link usa-current" aria-expanded="false" aria-controls="basic-nav-section-two"> <span> Resources for You <i class="fas fa-caret-down margin-left-05"></i></span> </button>
<ul id="basic-nav-section-two" class="usa-nav__submenu bg-secondary" hidden="">
<li class="usa-nav__submenu-item"> <a href="/portals/researchers.html"><span>For Researchers</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/portals/publishers.html"><span>For Publishers</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/portals/librarians.html"><span>For Librarians</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/training.html"><span>For Educators/Trainers</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/portals/healthcare.html"><span>For Health care Professionals</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/portals/public.html"><span>For the Public</span></a> </li>
</ul>
</li>
<li class="usa-nav__primary-item desktop-lg:margin-x-5 desktop:margin-x-3 tablet:margin-x-0">
<button type="button" class="usa-accordion__button usa-nav__link usa-current" aria-expanded="false" aria-controls="basic-nav-section-three"> <span>Explore NLM <i class="fas fa-caret-down margin-left-05"></i> </span> </button>
<ul id="basic-nav-section-three" class="usa-nav__submenu bg-secondary" hidden="">
<li class="usa-nav__submenu-item"> <a href="/about/index.html"><span>About the Library</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/about/visitor.html"><span>Visit the Library</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/hmd/index.html"><span>History of Medicine</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/about/org.html"><span>NLM by Organization</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/news/newsandevents.html"><span>News, Events, and Updates</span></a> </li>
</ul>
</li>
<li class="usa-nav__primary-item desktop-lg:margin-x-5 desktop:margin-x-3 tablet:margin-x-0">
<button type="button" class="usa-accordion__button usa-nav__link usa-current" aria-expanded="false" aria-controls="basic-nav-section-four"> <span> Grants and Research <i class="fas fa-caret-down margin-left-05"></i> </span> </button>
<ul id="basic-nav-section-four" class="usa-nav__submenu bg-secondary" hidden="">
<li class="usa-nav__submenu-item"> <a href="/ep/index.html"><span>NLM Extramural Programs</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="/research/index.html"><span>NLM Division of Intramural Research</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="https://www.ncbi.nlm.nih.gov/"><span>National Center for Biotechnology Information</span></a> </li>
<li class="usa-nav__submenu-item"> <a href="//lhncbc.nlm.nih.gov/"><span>Lister Hill National Center for Biomedical Communications</span></a> </li>
</ul>
</li>
</ul>
</nav>
</div>
</div>
<!-- End of TOP NAV -->
<!-- Breadcrumbs -->
<div class="grid-container">
<nav class="usa-breadcrumb usa-breadcrumb--wrap padding-top-1" aria-label="Breadcrumbs">
<ol class="usa-breadcrumb__list">
<li class="usa-breadcrumb__list-item"> <a href="/" class="usa-breadcrumb__link"><span>Home</span></a> </li>
</ol>
</nav>
</div>
<!-- End Breadcrumbs -->
<main class="padding-bottom-5" id="main">
<div class="grid-container">
<div class="grid-row">
<div class="grid-col">
<!-- Page title as a real top-level heading; the "h1" class is kept so existing class-based styling still applies. -->
<h1 class="h1">NLM Web Collecting and Archiving</h1>
</div>
</div>
<div class="mult_img_container"><a title="Ebola Outbreak 2014 Web Archive Collection" href="https://archive-it.org/collections/4887?fc=websiteGroup%3AEbola+Outbreak+2014" target="_blank" rel="noopener noreferrer"><img title="Ebola Outbreak 2014 Web Archive Collection" src="/webcollecting/images/CDC_US_532_400.jpg" alt="CDC home page" /></a> <a title="Health and Medicine Blogs Web Archive Collection" href="https://archive-it.org/collections/2722" target="_blank" rel="noopener noreferrer"><img title="Health and Medicine Blogs Web Archive Collection" src="/webcollecting/images/emergiblog_400x157.jpg" alt="Emergiblog" /></a> <a title="Environmental Health Web Archive Collection" href="https://archive-it.org/collections/7219" target="_blank" rel="noopener noreferrer"><img title="Environmental Health Web Archive Collection" src="/webcollecting/images/PHE400x157.jpg" alt="Detail of Public Health Emergency page of the Office of the Assistant Secretary for Preparedness and Response" /></a></div>
<!-- Vertical spacer: a paragraph rather than an empty heading, so no blank entry appears in the heading outline. -->
<p>&nbsp;</p>
<!-- Search form for NLM's Archive-It collections; the visible prompt is the text input's label. -->
<div style="text-align: center;"><label for="webarchive-query">Search NLM's web archive collections</label></div>
<form action="https://www.archive-it.org/organizations/350" method="get">
<div style="text-align: center;"><input id="webarchive-query" name="q" type="text" /> <input name="show" type="hidden" value="ArchivedPages" /> <input name="go" type="submit" value="Go" /></div>
</form>
<h3><strong>Background</strong></h3>
<p>The National Library of Medicine (NLM) has a mandate to collect, preserve and make accessible the scholarly biomedical literature as well as resources that illustrate a diversity of philosophical and cultural perspectives. New forms of publication on the web, such as blogs authored by doctors and patients, illuminate health care thought and practice in the 21st century. In 2011 NLM piloted a project, resulting in the Health and Medicine Blogs collection, to better understand the processes and challenges of collecting born-digital web content. Since then, NLM has developed collections on the H7N9 Avian Flu, Autism and Alzheimer&rsquo;s on the Web, and Global Health Events, including the 2014 Ebola Outbreak. NLM continues to carefully build capacity in this area to better understand the acquisition, accessibility and preservation of the diverse digital formats found on the web.</p>
<!-- Spacers are paragraphs, not empty headings, so assistive technology does not announce blank headings. -->
<p>&nbsp;</p>
<h3><strong>Web Archive Collections</strong></h3>
<p>NLM's web collecting and archiving are primarily collection-based activities. Multiple web sites are collected as part of a broader theme, event or topic. NLM gives highest priority to content that is at risk of loss or that is believed to be of vital interest to current and future NLM audiences and unlikely to be preserved elsewhere. The Library's goal is to collect and preserve selected web content at a particular point in time (i.e., snapshots) or over a period of time (e.g., daily, monthly, quarterly, etc.). NLM's web archive collections are hosted and stored at the Internet Archive data centers.</p>
<p>&nbsp;</p>
<ul>
<li><a href="https://archive-it.org/organizations/350?fc=meta_Group%3AThematic+and+Event-Based+Collections">Explore NLM Thematic and Event-Based Collections</a></li>
<li><a href="https://archive-it.org/organizations/350?fc=meta_Group%3ANLM+Institutional+Archives">Explore NLM Institutional Archives</a></li>
<li><a title="NLM Archives and Manuscripts Collections web archives" href="https://archive-it.org/organizations/350?fc=meta_Group%3AArchives+and+Manuscripts+Collections">Explore NLM Archives and Manuscripts Collections</a></li>
</ul>
<br />
<h4><strong>Collaborative efforts:</strong></h4>
<ul>
<li><a href="https://siarchives.si.edu/about/partnerships/fedweb">Federal Web Archiving Interest Group</a> (2014-present)</li>
<li>Contributors to the <a href="https://eotarchive.org/">End of Term web archive</a> (2016-present)</li>
<!-- External links use https:// throughout. -->
<li><a href="https://archive-it.org/collections/13529" target="_blank" rel="noopener noreferrer">Novel Coronavirus (Covid-19)</a> web archive (2020), in collaboration with the <span id="orgId">Content Development Group of the <a href="https://netpreserve.org/" target="_blank" rel="noopener noreferrer">International Internet Preservation Consortium</a> and <a href="https://archive-it.org/" target="_blank" rel="noopener noreferrer">Archive-It</a></span></li>
</ul>
<p>&nbsp;</p>
<h3><strong>Learn more </strong></h3>
<ul>
<li>Collection Development Guidelines of the National Library of Medicine: <a title="NLM Collection Development Manual: Web Content" href="https://www.ncbi.nlm.nih.gov/books/NBK518732/" target="_blank" rel="noopener noreferrer">Web Content</a></li>
<li><a title="FAQs" href="/webcollecting/faq.html">NLM Web Collecting and Archiving FAQs</a></li>
<li><span style="color: #1b1b1b; font-family: Roboto, sans-serif; font-size: 16px; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial; float: none; display: inline !important;">User Services and Collection Division (USCD)</span> blog <a title="Circulating Now posts on web collecting" href="https://circulatingnow.nlm.nih.gov/?s=web+collecting" target="_blank" rel="noopener noreferrer"><em>Circulating Now</em></a></li>
</ul>
<p>&nbsp;</p>
<h3>Questions?</h3>
<p>&nbsp;Please contact us at <a id="anch_100" href="mailto:nlmwebcollecting@nlm.nih.gov">nlmwebcollecting@nlm.nih.gov</a></p>
<p class="margin-top-5"><small>Last Reviewed: October 17, 2024</small></p>
</div>
</main>
<!-- FOOTER -->
<footer class="usa-footer__primary-section padding-top-5 padding-bottom-3 insertfooter">
<div class="grid-container">
<div class="grid-row">
<div class="desktop:grid-col-3 grid-col-6"> <a href="https://www.nlm.nih.gov/socialmedia/index.html">
<p class="text-white margin-bottom-1">Connect with NLM</p>
</a>
<ul class="social_media add-list-reset">
<li class="margin-right-05"><a href="https://www.facebook.com/nationallibraryofmedicine"><img class="bg-secondary" src="https://www.nlm.nih.gov/images/facebook.svg" alt="Facebook"></a></li>
<li class="margin-right-05"><a title="External link: please review our privacy policy." href="https://www.linkedin.com/company/national-library-of-medicine-nlm/"><img class="bg-secondary" src="//www.nlm.nih.gov/images/linkedin.svg" alt="LinkedIn"></a></li>
<li class="margin-right-05"><a title="External link: please review our privacy policy." href="https://twitter.com/NLM_NIH"><img src="https://www.nlm.nih.gov/images/twitter.svg" class="padding-1 bg-secondary" alt="Twitter"></a></li>
<li class="margin-right-05"><a title="External link: please review our privacy policy." href="https://www.youtube.com/user/NLMNIH"><img src="//www.nlm.nih.gov/images/youtube.svg" class="bg-secondary" alt="YouTube"></a></li>
<li class="margin-right-05"><a title="External link: please review our privacy policy." href="https://public.govdelivery.com/accounts/USNLMOCPL/subscriber/new?preferences=true"><img src="//www.nlm.nih.gov/images/mail.svg" class=" bg-secondary" alt="Government Delivery"></a></li>
</ul>
</div>
<div class="desktop:grid-col-3 grid-col-6">
<p class="address_footer text-white"> National Library of Medicine <br>
<a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323" class="text-white"> 8600 Rockville Pike <br>
Bethesda, MD 20894 </a></p>
</div>
<div class="desktop:grid-col-3 grid-col-6">
<p><a href="/web_policies.html" class="text-white"> Web Policies </a><br>
<a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office" class="text-white"> FOIA </a><br>
<a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html" class="text-white">HHS Vulnerability Disclosure</a> </p>
</div>
<div class="desktop:grid-col-3 grid-col-6">
<p><a class="supportLink text-white" href="//support.nlm.nih.gov?from="> NLM Support Center </a> <br>
<a href="/accessibility.html" class="text-white"> Accessibility </a><br>
<a href="/careers/careers.html" class="text-white"> Careers </a></p>
</div>
</div>
<div class="grid-row">
<div class="grid-col-12">
<p class="text-center text-white"> <a class="text-white" href="//www.nlm.nih.gov/">NLM</a> | <a class="text-white" href="https://www.nih.gov/">NIH</a> | <a class="text-white" href="https://www.hhs.gov/">HHS</a> | <a class="text-white" href="https://www.usa.gov/">USA.gov</a></p>
</div>
</div>
</div>
</footer>
<!-- Scripts are loaded at the end of <body>, in document order: the USWDS bundle, jQuery,
     jQuery Migrate, then the two site scripts from /scripts/.
     NOTE(review): the site scripts presumably depend on jQuery being loaded first; confirm before reordering or adding defer/async. -->
<script src="//assets.nlm.nih.gov/uswds/js/uswds.min.js"></script>
<script src="//assets.nlm.nih.gov/jquery/jquery-latest.min.js"></script>
<script src="//assets.nlm.nih.gov/jquery/jquery-migrate-latest.min.js"></script>
<script src="/scripts/nlm_autocomplete.js"></script>
<script src="/scripts/nlm_uswds.js"></script>
</body>
</html>