nih-gov/circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/index.html

1438 lines
167 KiB
HTML
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<!DOCTYPE html>
<html lang="en-US">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<link rel="profile" href="http://gmpg.org/xfn/11">
<link rel="pingback" href="https://circulatingnow.nlm.nih.gov/xmlrpc.php">
<title>Exploring the Data of Web Archives as Part of Data Science @ NLM &#8211; Circulating Now from the NLM Historical Collections</title>
<script type="text/javascript">
/*
 * Web font bootstrap.
 * 1. Publish the font configuration as an explicit global (Lato and Raleway
 *    families plus the CSS API endpoint). Presumably read by webfont.js once
 *    it loads; verify against that script.
 * 2. Create a <script> element for webfont.js and insert it before the first
 *    <script> in the document so it downloads without blocking parsing.
 */
window.WebFontConfig = {"google":{"families":["Lato:r,i,b,bi:latin,latin-ext","Raleway:r:latin,latin-ext"]},"api_url":"https:\/\/fonts-api.wp.com\/css"};
(function() {
var wf = document.createElement('script');
wf.src = 'https://circulatingnow.nlm.nih.gov/wp-content/mu-plugins/wpcomsh/vendor/automattic/custom-fonts/js/webfont.js';
wf.type = 'text/javascript';
// `async` is a boolean property; use a real boolean rather than a truthy string.
wf.async = true;
var s = document.getElementsByTagName('script')[0];
s.parentNode.insertBefore(wf, s);
})();
</script>
<style id="jetpack-custom-fonts-css"></style>
<meta name="robots" content="max-image-preview:large">
<style>
/* Images whose sizes attribute is "auto" (or starts with "auto,") get a 3000x1500 intrinsic size under size containment. */
img:is([sizes="auto" i], [sizes^="auto," i]) {
  contain-intrinsic-size: 3000px 1500px;
}
</style>
<!-- Jetpack Site Verification Tags -->
<!-- DNS prefetch hints for third-party hosts -->
<link rel="dns-prefetch" href="//secure.gravatar.com">
<link rel="dns-prefetch" href="//stats.wp.com">
<link rel="dns-prefetch" href="//widgets.wp.com">
<link rel="dns-prefetch" href="//jetpack.wordpress.com">
<link rel="dns-prefetch" href="//s0.wp.com">
<link rel="dns-prefetch" href="//public-api.wordpress.com">
<link rel="dns-prefetch" href="//0.gravatar.com">
<link rel="dns-prefetch" href="//1.gravatar.com">
<link rel="dns-prefetch" href="//2.gravatar.com">
<!-- Preconnect hints -->
<link rel="preconnect" href="//i0.wp.com">
<link rel="preconnect" href="//c0.wp.com">
<!-- RSS feeds: site posts, site comments, comments on this post -->
<link rel="alternate" type="application/rss+xml" title="Circulating Now from the NLM Historical Collections &raquo; Feed" href="https://circulatingnow.nlm.nih.gov/feed/">
<link rel="alternate" type="application/rss+xml" title="Circulating Now from the NLM Historical Collections &raquo; Comments Feed" href="https://circulatingnow.nlm.nih.gov/comments/feed/">
<link rel="alternate" type="application/rss+xml" title="Circulating Now from the NLM Historical Collections &raquo; Exploring the Data of Web Archives as Part of Data Science @ NLM Comments Feed" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/feed/">
<script type="text/javascript">
/* <![CDATA[ */
/*
 * Settings object passed to the loader below as its second argument. The
 * loader reads `source` from it and writes `supports`, `DOMReady` and
 * `readyCallback` onto it.
 */
window._wpemojiSettings = {"baseUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/72x72\/","ext":".png","svgUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/svg\/","svgExt":".svg","source":{"concatemoji":"https:\/\/circulatingnow.nlm.nih.gov\/wp-includes\/js\/wp-emoji-release.min.js?ver=6.7.2"}};
/*
 * Emoji support detection (minified; code left untouched).
 *
 * - p(): draws two strings onto a canvas and reports whether the resulting
 *   pixel data is identical.
 * - u(): runs the "flag" and "emoji" tests by comparing a joined sequence
 *   against the same sequence split with a zero-width space.
 * - f(): creates the canvas (OffscreenCanvas inside a worker, otherwise a
 *   <canvas> element) and collects the result of each test.
 * - c(): stores the results plus a timestamp in sessionStorage under the
 *   key "wpEmojiSettingsSupports".
 * - The tests run in a Worker built from a Blob when Worker, OffscreenCanvas,
 *   URL.createObjectURL and Blob all exist; otherwise they run inline.
 * - After DOMContentLoaded, if not every test passed, the loader appends
 *   `source.concatemoji` (or `source.twemoji` + `source.wpemoji`) as a
 *   deferred script.
 *
 * NOTE(review): the cache freshness check compares `(new Date).valueOf()`
 * (milliseconds) against `timestamp+604800`, so a cached result is only
 * treated as fresh for roughly ten minutes. If a one-week lifetime was
 * intended the constant would need to be in milliseconds. Confirm upstream
 * before changing.
 */
/*! This file is auto-generated */
!function(i,n){var o,s,e;function c(e){try{var t={supportTests:e,timestamp:(new Date).valueOf()};sessionStorage.setItem(o,JSON.stringify(t))}catch(e){}}function p(e,t,n){e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(t,0,0);var t=new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data),r=(e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(n,0,0),new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data));return t.every(function(e,t){return e===r[t]})}function u(e,t,n){switch(t){case"flag":return n(e,"\ud83c\udff3\ufe0f\u200d\u26a7\ufe0f","\ud83c\udff3\ufe0f\u200b\u26a7\ufe0f")?!1:!n(e,"\ud83c\uddfa\ud83c\uddf3","\ud83c\uddfa\u200b\ud83c\uddf3")&&!n(e,"\ud83c\udff4\udb40\udc67\udb40\udc62\udb40\udc65\udb40\udc6e\udb40\udc67\udb40\udc7f","\ud83c\udff4\u200b\udb40\udc67\u200b\udb40\udc62\u200b\udb40\udc65\u200b\udb40\udc6e\u200b\udb40\udc67\u200b\udb40\udc7f");case"emoji":return!n(e,"\ud83d\udc26\u200d\u2b1b","\ud83d\udc26\u200b\u2b1b")}return!1}function f(e,t,n){var r="undefined"!=typeof WorkerGlobalScope&&self instanceof WorkerGlobalScope?new OffscreenCanvas(300,150):i.createElement("canvas"),a=r.getContext("2d",{willReadFrequently:!0}),o=(a.textBaseline="top",a.font="600 32px Arial",{});return e.forEach(function(e){o[e]=t(a,e,n)}),o}function t(e){var t=i.createElement("script");t.src=e,t.defer=!0,i.head.appendChild(t)}"undefined"!=typeof Promise&&(o="wpEmojiSettingsSupports",s=["flag","emoji"],n.supports={everything:!0,everythingExceptFlag:!0},e=new Promise(function(e){i.addEventListener("DOMContentLoaded",e,{once:!0})}),new Promise(function(t){var n=function(){try{var e=JSON.parse(sessionStorage.getItem(o));if("object"==typeof e&&"number"==typeof e.timestamp&&(new Date).valueOf()<e.timestamp+604800&&"object"==typeof e.supportTests)return e.supportTests}catch(e){}return null}();if(!n){if("undefined"!=typeof Worker&&"undefined"!=typeof OffscreenCanvas&&"undefined"!=typeof URL&&URL.createObjectURL&&"undefined"!=typeof 
Blob)try{var e="postMessage("+f.toString()+"("+[JSON.stringify(s),u.toString(),p.toString()].join(",")+"));",r=new Blob([e],{type:"text/javascript"}),a=new Worker(URL.createObjectURL(r),{name:"wpTestEmojiSupports"});return void(a.onmessage=function(e){c(n=e.data),a.terminate(),t(n)})}catch(e){}c(n=f(s,u,p))}t(n)}).then(function(e){for(var t in e)n.supports[t]=e[t],n.supports.everything=n.supports.everything&&n.supports[t],"flag"!==t&&(n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&n.supports[t]);n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&!n.supports.flag,n.DOMReady=!1,n.readyCallback=function(){n.DOMReady=!0}}).then(function(){return e}).then(function(){var e;n.supports.everything||(n.readyCallback(),(e=n.source||{}).concatemoji?t(e.concatemoji):e.wpemoji&&e.twemoji&&(t(e.twemoji),t(e.wpemoji)))}))}((window,document),window._wpemojiSettings);
/* ]]> */
</script>
<link rel='stylesheet' id='all-css-27970385127fad0d4d6ecf3ab114824d' href='https://circulatingnow.nlm.nih.gov/_static/??-eJyNUltSwzAMvBBGFEJTPhh+mOEAHIBxbMU19WssmTa3x2kolPBov+KNtNKupG0SKgbGwJBcMTYQvCInqTbgoy4OCTI6yahFisQzdKmILrZfJfr6JVjeKd1e61WvcKWWzfVt0+Ky7burZtmqO1zNWYfGplTYYTbQFes0dC6qjXC2yzIPQDw4/Ivq5BALC5Ot/p5og3JFVxevBB61lejQj8xjkCods3BopBouvQ0n2TV2jI85B2m+iIO6bVLR0xreMOiYQRaOXjJbBYw7niqJrdUGWezVE9Ri8PFnzDl3ZLVPigHHLfw7LxX3wyX4dPiIqarDoGwFT/FRaj3A8yRmqj3unX4o4XWdAAHHzMXI37vOciQR8mSRZC+zFb3DXRd3orc7/HFUf91l9eonp6UjlW1iG4OoUelEfXyEf4me28DZDZ6Y45xy3GyGzi6xlhn1fvzj0wZzivlSlwgUla3GXTSRvoHDbT74+0XbLK5W7eKmeQfN0IOh' type='text/css' media='all' />
<style id="wp-block-library-inline-css">
/* Utility class for justified text. */
.has-text-align-justify {
  text-align: justify;
}
</style>
<style id="tortuga-stylesheet-inline-css">
/* Clip the site title and description down to a 1px box. */
.site-title,
.site-description {
  position: absolute;
  clip: rect(1px, 1px, 1px, 1px);
  width: 1px;
  height: 1px;
  overflow: hidden;
}
</style>
<style id="wp-emoji-styles-inline-css">
/* Emoji and smiley images: inline, text-sized, with no box decoration. */
img.wp-smiley,
img.emoji {
  display: inline !important;
  border: none !important;
  box-shadow: none !important;
  height: 1em !important;
  width: 1em !important;
  margin: 0 0.07em !important;
  vertical-align: -0.1em !important;
  background: none !important;
  padding: 0 !important;
}
</style>
<style id="jetpack-sharing-buttons-style-inline-css">
/* Sharing button list: wrapping flex row with no bullets. */
.jetpack-sharing-buttons__services-list {
  display: flex;
  flex-direction: row;
  flex-wrap: wrap;
  gap: 0;
  list-style-type: none;
  margin: 5px;
  padding: 0;
}

/* Icon size variants. */
.jetpack-sharing-buttons__services-list.has-small-icon-size {
  font-size: 12px;
}
.jetpack-sharing-buttons__services-list.has-normal-icon-size {
  font-size: 16px;
}
.jetpack-sharing-buttons__services-list.has-large-icon-size {
  font-size: 24px;
}
.jetpack-sharing-buttons__services-list.has-huge-icon-size {
  font-size: 36px;
}

/* The list is hidden when printing. */
@media print {
  .jetpack-sharing-buttons__services-list {
    display: none !important;
  }
}

.editor-styles-wrapper .wp-block-jetpack-sharing-buttons {
  gap: 0;
  padding-inline-start: 0;
}

ul.jetpack-sharing-buttons__services-list.has-background {
  padding: 1.25em 2.375em;
}
</style>
<style id="classic-theme-styles-inline-css">
/*! This file is auto-generated */
/* Pill-shaped dark button link. */
.wp-block-button__link {
  color: #fff;
  background-color: #32373c;
  border-radius: 9999px;
  box-shadow: none;
  text-decoration: none;
  padding: calc(.667em + 2px) calc(1.333em + 2px);
  font-size: 1.125em;
}

.wp-block-file__button {
  background: #32373c;
  color: #fff;
  text-decoration: none;
}
</style>
<style id='global-styles-inline-css'>
:root{--wp--preset--aspect-ratio--square: 1;--wp--preset--aspect-ratio--4-3: 4/3;--wp--preset--aspect-ratio--3-4: 3/4;--wp--preset--aspect-ratio--3-2: 3/2;--wp--preset--aspect-ratio--2-3: 2/3;--wp--preset--aspect-ratio--16-9: 16/9;--wp--preset--aspect-ratio--9-16: 9/16;--wp--preset--color--black: #000000;--wp--preset--color--cyan-bluish-gray: #abb8c3;--wp--preset--color--white: #ffffff;--wp--preset--color--pale-pink: #f78da7;--wp--preset--color--vivid-red: #cf2e2e;--wp--preset--color--luminous-vivid-orange: #ff6900;--wp--preset--color--luminous-vivid-amber: #fcb900;--wp--preset--color--light-green-cyan: #7bdcb5;--wp--preset--color--vivid-green-cyan: #00d084;--wp--preset--color--pale-cyan-blue: #8ed1fc;--wp--preset--color--vivid-cyan-blue: #0693e3;--wp--preset--color--vivid-purple: #9b51e0;--wp--preset--color--primary: #dd5533;--wp--preset--color--secondary: #c43c1a;--wp--preset--color--tertiary: #aa2200;--wp--preset--color--accent: #3355dd;--wp--preset--color--highlight: #2bc41a;--wp--preset--color--light-gray: #f0f0f0;--wp--preset--color--gray: #999999;--wp--preset--color--dark-gray: #303030;--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple: linear-gradient(135deg,rgba(6,147,227,1) 0%,rgb(155,81,224) 100%);--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan: linear-gradient(135deg,rgb(122,220,180) 0%,rgb(0,208,130) 100%);--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange: linear-gradient(135deg,rgba(252,185,0,1) 0%,rgba(255,105,0,1) 100%);--wp--preset--gradient--luminous-vivid-orange-to-vivid-red: linear-gradient(135deg,rgba(255,105,0,1) 0%,rgb(207,46,46) 100%);--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray: linear-gradient(135deg,rgb(238,238,238) 0%,rgb(169,184,195) 100%);--wp--preset--gradient--cool-to-warm-spectrum: linear-gradient(135deg,rgb(74,234,220) 0%,rgb(151,120,209) 20%,rgb(207,42,186) 40%,rgb(238,44,130) 60%,rgb(251,105,98) 80%,rgb(254,248,76) 100%);--wp--preset--gradient--blush-light-purple: 
linear-gradient(135deg,rgb(255,206,236) 0%,rgb(152,150,240) 100%);--wp--preset--gradient--blush-bordeaux: linear-gradient(135deg,rgb(254,205,165) 0%,rgb(254,45,45) 50%,rgb(107,0,62) 100%);--wp--preset--gradient--luminous-dusk: linear-gradient(135deg,rgb(255,203,112) 0%,rgb(199,81,192) 50%,rgb(65,88,208) 100%);--wp--preset--gradient--pale-ocean: linear-gradient(135deg,rgb(255,245,203) 0%,rgb(182,227,212) 50%,rgb(51,167,181) 100%);--wp--preset--gradient--electric-grass: linear-gradient(135deg,rgb(202,248,128) 0%,rgb(113,206,126) 100%);--wp--preset--gradient--midnight: linear-gradient(135deg,rgb(2,3,129) 0%,rgb(40,116,252) 100%);--wp--preset--font-size--small: 13px;--wp--preset--font-size--medium: 20px;--wp--preset--font-size--large: 36px;--wp--preset--font-size--x-large: 42px;--wp--preset--font-family--albert-sans: 'Albert Sans', sans-serif;--wp--preset--font-family--alegreya: Alegreya, serif;--wp--preset--font-family--arvo: Arvo, serif;--wp--preset--font-family--bodoni-moda: 'Bodoni Moda', serif;--wp--preset--font-family--bricolage-grotesque: 'Bricolage Grotesque', sans-serif;--wp--preset--font-family--cabin: Cabin, sans-serif;--wp--preset--font-family--chivo: Chivo, sans-serif;--wp--preset--font-family--commissioner: Commissioner, sans-serif;--wp--preset--font-family--cormorant: Cormorant, serif;--wp--preset--font-family--courier-prime: 'Courier Prime', monospace;--wp--preset--font-family--crimson-pro: 'Crimson Pro', serif;--wp--preset--font-family--dm-mono: 'DM Mono', monospace;--wp--preset--font-family--dm-sans: 'DM Sans', sans-serif;--wp--preset--font-family--dm-serif-display: 'DM Serif Display', serif;--wp--preset--font-family--domine: Domine, serif;--wp--preset--font-family--eb-garamond: 'EB Garamond', serif;--wp--preset--font-family--epilogue: Epilogue, sans-serif;--wp--preset--font-family--fahkwang: Fahkwang, sans-serif;--wp--preset--font-family--figtree: Figtree, sans-serif;--wp--preset--font-family--fira-sans: 'Fira Sans', 
sans-serif;--wp--preset--font-family--fjalla-one: 'Fjalla One', sans-serif;--wp--preset--font-family--fraunces: Fraunces, serif;--wp--preset--font-family--gabarito: Gabarito, system-ui;--wp--preset--font-family--ibm-plex-mono: 'IBM Plex Mono', monospace;--wp--preset--font-family--ibm-plex-sans: 'IBM Plex Sans', sans-serif;--wp--preset--font-family--ibarra-real-nova: 'Ibarra Real Nova', serif;--wp--preset--font-family--instrument-serif: 'Instrument Serif', serif;--wp--preset--font-family--inter: Inter, sans-serif;--wp--preset--font-family--josefin-sans: 'Josefin Sans', sans-serif;--wp--preset--font-family--jost: Jost, sans-serif;--wp--preset--font-family--libre-baskerville: 'Libre Baskerville', serif;--wp--preset--font-family--libre-franklin: 'Libre Franklin', sans-serif;--wp--preset--font-family--literata: Literata, serif;--wp--preset--font-family--lora: Lora, serif;--wp--preset--font-family--merriweather: Merriweather, serif;--wp--preset--font-family--montserrat: Montserrat, sans-serif;--wp--preset--font-family--newsreader: Newsreader, serif;--wp--preset--font-family--noto-sans-mono: 'Noto Sans Mono', sans-serif;--wp--preset--font-family--nunito: Nunito, sans-serif;--wp--preset--font-family--open-sans: 'Open Sans', sans-serif;--wp--preset--font-family--overpass: Overpass, sans-serif;--wp--preset--font-family--pt-serif: 'PT Serif', serif;--wp--preset--font-family--petrona: Petrona, serif;--wp--preset--font-family--piazzolla: Piazzolla, serif;--wp--preset--font-family--playfair-display: 'Playfair Display', serif;--wp--preset--font-family--plus-jakarta-sans: 'Plus Jakarta Sans', sans-serif;--wp--preset--font-family--poppins: Poppins, sans-serif;--wp--preset--font-family--raleway: Raleway, sans-serif;--wp--preset--font-family--roboto: Roboto, sans-serif;--wp--preset--font-family--roboto-slab: 'Roboto Slab', serif;--wp--preset--font-family--rubik: Rubik, sans-serif;--wp--preset--font-family--rufina: Rufina, serif;--wp--preset--font-family--sora: Sora, 
sans-serif;--wp--preset--font-family--source-sans-3: 'Source Sans 3', sans-serif;--wp--preset--font-family--source-serif-4: 'Source Serif 4', serif;--wp--preset--font-family--space-mono: 'Space Mono', monospace;--wp--preset--font-family--syne: Syne, sans-serif;--wp--preset--font-family--texturina: Texturina, serif;--wp--preset--font-family--urbanist: Urbanist, sans-serif;--wp--preset--font-family--work-sans: 'Work Sans', sans-serif;--wp--preset--spacing--20: 0.44rem;--wp--preset--spacing--30: 0.67rem;--wp--preset--spacing--40: 1rem;--wp--preset--spacing--50: 1.5rem;--wp--preset--spacing--60: 2.25rem;--wp--preset--spacing--70: 3.38rem;--wp--preset--spacing--80: 5.06rem;--wp--preset--shadow--natural: 6px 6px 9px rgba(0, 0, 0, 0.2);--wp--preset--shadow--deep: 12px 12px 50px rgba(0, 0, 0, 0.4);--wp--preset--shadow--sharp: 6px 6px 0px rgba(0, 0, 0, 0.2);--wp--preset--shadow--outlined: 6px 6px 0px -3px rgba(255, 255, 255, 1), 6px 6px rgba(0, 0, 0, 1);--wp--preset--shadow--crisp: 6px 6px 0px rgba(0, 0, 0, 1);}:where(.is-layout-flex){gap: 0.5em;}:where(.is-layout-grid){gap: 0.5em;}body .is-layout-flex{display: flex;}.is-layout-flex{flex-wrap: wrap;align-items: center;}.is-layout-flex > :is(*, div){margin: 0;}body .is-layout-grid{display: grid;}.is-layout-grid > :is(*, div){margin: 0;}:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;}:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}.has-black-color{color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-color{color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-color{color: var(--wp--preset--color--white) !important;}.has-pale-pink-color{color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-color{color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-color{color: var(--wp--preset--color--luminous-vivid-orange) 
!important;}.has-luminous-vivid-amber-color{color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-color{color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-color{color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-color{color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-color{color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-color{color: var(--wp--preset--color--vivid-purple) !important;}.has-black-background-color{background-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-background-color{background-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-background-color{background-color: var(--wp--preset--color--white) !important;}.has-pale-pink-background-color{background-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-background-color{background-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-background-color{background-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-background-color{background-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-background-color{background-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-background-color{background-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-background-color{background-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-background-color{background-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-background-color{background-color: var(--wp--preset--color--vivid-purple) !important;}.has-black-border-color{border-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-border-color{border-color: var(--wp--preset--color--cyan-bluish-gray) 
!important;}.has-white-border-color{border-color: var(--wp--preset--color--white) !important;}.has-pale-pink-border-color{border-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-border-color{border-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-border-color{border-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-border-color{border-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-border-color{border-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-border-color{border-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-border-color{border-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-border-color{border-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-border-color{border-color: var(--wp--preset--color--vivid-purple) !important;}.has-vivid-cyan-blue-to-vivid-purple-gradient-background{background: var(--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple) !important;}.has-light-green-cyan-to-vivid-green-cyan-gradient-background{background: var(--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan) !important;}.has-luminous-vivid-amber-to-luminous-vivid-orange-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange) !important;}.has-luminous-vivid-orange-to-vivid-red-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-orange-to-vivid-red) !important;}.has-very-light-gray-to-cyan-bluish-gray-gradient-background{background: var(--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray) !important;}.has-cool-to-warm-spectrum-gradient-background{background: var(--wp--preset--gradient--cool-to-warm-spectrum) !important;}.has-blush-light-purple-gradient-background{background: var(--wp--preset--gradient--blush-light-purple) 
!important;}.has-blush-bordeaux-gradient-background{background: var(--wp--preset--gradient--blush-bordeaux) !important;}.has-luminous-dusk-gradient-background{background: var(--wp--preset--gradient--luminous-dusk) !important;}.has-pale-ocean-gradient-background{background: var(--wp--preset--gradient--pale-ocean) !important;}.has-electric-grass-gradient-background{background: var(--wp--preset--gradient--electric-grass) !important;}.has-midnight-gradient-background{background: var(--wp--preset--gradient--midnight) !important;}.has-small-font-size{font-size: var(--wp--preset--font-size--small) !important;}.has-medium-font-size{font-size: var(--wp--preset--font-size--medium) !important;}.has-large-font-size{font-size: var(--wp--preset--font-size--large) !important;}.has-x-large-font-size{font-size: var(--wp--preset--font-size--x-large) !important;}.has-albert-sans-font-family{font-family: var(--wp--preset--font-family--albert-sans) !important;}.has-alegreya-font-family{font-family: var(--wp--preset--font-family--alegreya) !important;}.has-arvo-font-family{font-family: var(--wp--preset--font-family--arvo) !important;}.has-bodoni-moda-font-family{font-family: var(--wp--preset--font-family--bodoni-moda) !important;}.has-bricolage-grotesque-font-family{font-family: var(--wp--preset--font-family--bricolage-grotesque) !important;}.has-cabin-font-family{font-family: var(--wp--preset--font-family--cabin) !important;}.has-chivo-font-family{font-family: var(--wp--preset--font-family--chivo) !important;}.has-commissioner-font-family{font-family: var(--wp--preset--font-family--commissioner) !important;}.has-cormorant-font-family{font-family: var(--wp--preset--font-family--cormorant) !important;}.has-courier-prime-font-family{font-family: var(--wp--preset--font-family--courier-prime) !important;}.has-crimson-pro-font-family{font-family: var(--wp--preset--font-family--crimson-pro) !important;}.has-dm-mono-font-family{font-family: var(--wp--preset--font-family--dm-mono) 
!important;}.has-dm-sans-font-family{font-family: var(--wp--preset--font-family--dm-sans) !important;}.has-dm-serif-display-font-family{font-family: var(--wp--preset--font-family--dm-serif-display) !important;}.has-domine-font-family{font-family: var(--wp--preset--font-family--domine) !important;}.has-eb-garamond-font-family{font-family: var(--wp--preset--font-family--eb-garamond) !important;}.has-epilogue-font-family{font-family: var(--wp--preset--font-family--epilogue) !important;}.has-fahkwang-font-family{font-family: var(--wp--preset--font-family--fahkwang) !important;}.has-figtree-font-family{font-family: var(--wp--preset--font-family--figtree) !important;}.has-fira-sans-font-family{font-family: var(--wp--preset--font-family--fira-sans) !important;}.has-fjalla-one-font-family{font-family: var(--wp--preset--font-family--fjalla-one) !important;}.has-fraunces-font-family{font-family: var(--wp--preset--font-family--fraunces) !important;}.has-gabarito-font-family{font-family: var(--wp--preset--font-family--gabarito) !important;}.has-ibm-plex-mono-font-family{font-family: var(--wp--preset--font-family--ibm-plex-mono) !important;}.has-ibm-plex-sans-font-family{font-family: var(--wp--preset--font-family--ibm-plex-sans) !important;}.has-ibarra-real-nova-font-family{font-family: var(--wp--preset--font-family--ibarra-real-nova) !important;}.has-instrument-serif-font-family{font-family: var(--wp--preset--font-family--instrument-serif) !important;}.has-inter-font-family{font-family: var(--wp--preset--font-family--inter) !important;}.has-josefin-sans-font-family{font-family: var(--wp--preset--font-family--josefin-sans) !important;}.has-jost-font-family{font-family: var(--wp--preset--font-family--jost) !important;}.has-libre-baskerville-font-family{font-family: var(--wp--preset--font-family--libre-baskerville) !important;}.has-libre-franklin-font-family{font-family: var(--wp--preset--font-family--libre-franklin) !important;}.has-literata-font-family{font-family: 
var(--wp--preset--font-family--literata) !important;}.has-lora-font-family{font-family: var(--wp--preset--font-family--lora) !important;}.has-merriweather-font-family{font-family: var(--wp--preset--font-family--merriweather) !important;}.has-montserrat-font-family{font-family: var(--wp--preset--font-family--montserrat) !important;}.has-newsreader-font-family{font-family: var(--wp--preset--font-family--newsreader) !important;}.has-noto-sans-mono-font-family{font-family: var(--wp--preset--font-family--noto-sans-mono) !important;}.has-nunito-font-family{font-family: var(--wp--preset--font-family--nunito) !important;}.has-open-sans-font-family{font-family: var(--wp--preset--font-family--open-sans) !important;}.has-overpass-font-family{font-family: var(--wp--preset--font-family--overpass) !important;}.has-pt-serif-font-family{font-family: var(--wp--preset--font-family--pt-serif) !important;}.has-petrona-font-family{font-family: var(--wp--preset--font-family--petrona) !important;}.has-piazzolla-font-family{font-family: var(--wp--preset--font-family--piazzolla) !important;}.has-playfair-display-font-family{font-family: var(--wp--preset--font-family--playfair-display) !important;}.has-plus-jakarta-sans-font-family{font-family: var(--wp--preset--font-family--plus-jakarta-sans) !important;}.has-poppins-font-family{font-family: var(--wp--preset--font-family--poppins) !important;}.has-raleway-font-family{font-family: var(--wp--preset--font-family--raleway) !important;}.has-roboto-font-family{font-family: var(--wp--preset--font-family--roboto) !important;}.has-roboto-slab-font-family{font-family: var(--wp--preset--font-family--roboto-slab) !important;}.has-rubik-font-family{font-family: var(--wp--preset--font-family--rubik) !important;}.has-rufina-font-family{font-family: var(--wp--preset--font-family--rufina) !important;}.has-sora-font-family{font-family: var(--wp--preset--font-family--sora) !important;}.has-source-sans-3-font-family{font-family: 
var(--wp--preset--font-family--source-sans-3) !important;}.has-source-serif-4-font-family{font-family: var(--wp--preset--font-family--source-serif-4) !important;}.has-space-mono-font-family{font-family: var(--wp--preset--font-family--space-mono) !important;}.has-syne-font-family{font-family: var(--wp--preset--font-family--syne) !important;}.has-texturina-font-family{font-family: var(--wp--preset--font-family--texturina) !important;}.has-urbanist-font-family{font-family: var(--wp--preset--font-family--urbanist) !important;}.has-work-sans-font-family{font-family: var(--wp--preset--font-family--work-sans) !important;}
:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;}
:root :where(.wp-block-pullquote){font-size: 1.5em;line-height: 1.6;}
:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}
</style>
<link rel='stylesheet' id='dashicons-css' href='https://circulatingnow.nlm.nih.gov/wp-includes/css/dashicons.min.css?ver=6.7.2' media='all' />
<style id="akismet-widget-style-inline-css">
/* Widget container: colour variables and width limits. */
.a-stats {
  --akismet-color-mid-green: #357b49;
  --akismet-color-white: #fff;
  --akismet-color-light-grey: #f6f7f7;
  max-width: 350px;
  width: auto;
}

/* Reset every descendant, then restore border-box sizing. */
.a-stats * {
  all: unset;
  box-sizing: border-box;
}

.a-stats strong {
  font-weight: 600;
}

/* The stats link is rendered as a green block button in all link states. */
.a-stats a.a-stats__link,
.a-stats a.a-stats__link:visited,
.a-stats a.a-stats__link:active {
  background: var(--akismet-color-mid-green);
  border: none;
  box-shadow: none;
  border-radius: 8px;
  color: var(--akismet-color-white);
  cursor: pointer;
  display: block;
  font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', 'Roboto', 'Oxygen-Sans', 'Ubuntu', 'Cantarell', 'Helvetica Neue', sans-serif;
  font-weight: 500;
  padding: 12px;
  text-align: center;
  text-decoration: none;
  transition: all 0.2s ease;
}

/* Extra specificity to deal with TwentyTwentyOne focus style */
.widget .a-stats a.a-stats__link:focus {
  background: var(--akismet-color-mid-green);
  color: var(--akismet-color-white);
  text-decoration: none;
}

/* Hover: slightly brighter with a soft shadow. */
.a-stats a.a-stats__link:hover {
  filter: brightness(110%);
  box-shadow: 0 4px 12px rgba(0, 0, 0, 0.06), 0 0 2px rgba(0, 0, 0, 0.16);
}

/* The count sits on its own line and never wraps. */
.a-stats .count {
  color: var(--akismet-color-white);
  display: block;
  font-size: 1.5em;
  line-height: 1.4;
  padding: 0 13px;
  white-space: nowrap;
}
</style>
<link rel='stylesheet' id='front_end_css-css' href='https://circulatingnow.nlm.nih.gov/wp-content/plugins/broken-link-notifier/includes/css/results-front.css?ver=1.2.0' media='all' />
<style id="jetpack-global-styles-frontend-style-inline-css">
/* Heading/base font variables are unset; the *-default variables hold a system font stack. */
:root {
  --font-headings: unset;
  --font-base: unset;
  --font-headings-default: -apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,Oxygen-Sans,Ubuntu,Cantarell,"Helvetica Neue",sans-serif;
  --font-base-default: -apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,Oxygen-Sans,Ubuntu,Cantarell,"Helvetica Neue",sans-serif;
}
</style>
<!-- Related posts: options global first, then the related-posts script (presumably its consumer; verify). -->
<script type="text/javascript" id="jetpack_related-posts-js-extra">
var related_posts_js_options = {"post_heading":"h4"};
</script>
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/wp-content/plugins/jetpack/_inc/build/related-posts/related-posts.min.js?m=1734358916"></script>
<!-- Jetpack MU settings global, defined before the concatenated static bundle loads. -->
<script type="text/javascript" id="jetpack-mu-wpcom-settings-js-before">
var JETPACK_MU_WPCOM_SETTINGS = {"assetsUrl":"https:\/\/circulatingnow.nlm.nih.gov\/wp-content\/mu-plugins\/wpcomsh\/jetpack_vendor\/automattic\/jetpack-mu-wpcom\/src\/build\/"};
</script>
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/_static/??-eJyNy0EOQDAQBdALYSjCRpylkUlbMa3403J8Gwfw9u8+6y1F5aiknoVBmi7NzpIFWEE7yKscI3wojYTY7KjuHwnFPRn8lVWWbuqndpiNGV81aiq8"></script>
<!-- jQuery core, followed by jQuery Migrate. -->
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/wp-includes/js/jquery/jquery.min.js?ver=3.7.1" id="jquery-core-js"></script>
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/wp-includes/js/jquery/jquery-migrate.min.js?m=1686289764"></script>
<!-- Google Analytics Code Snippet By GA4WP -->
<script async src="https://www.googletagmanager.com/gtag/js?id=G-P1FPTH9PL4"></script>
<script>
// Reuse an existing dataLayer array if one is already defined, otherwise create it.
window.dataLayer = window.dataLayer || [];
// gtag() pushes its raw `arguments` object onto dataLayer.
function gtag(){dataLayer.push(arguments);}
gtag('js', new Date());
gtag('config', 'G-P1FPTH9PL4');
</script>
<!-- end of Google Analytics Code Snippet by GA4WP -->
<!-- REST API root, JSON representation of this post, and RSD endpoint -->
<link rel="https://api.w.org/" href="https://circulatingnow.nlm.nih.gov/wp-json/" />
<link rel="alternate" title="JSON" type="application/json" href="https://circulatingnow.nlm.nih.gov/wp-json/wp/v2/posts/21153" />
<link rel="EditURI" type="application/rsd+xml" title="RSD" href="https://circulatingnow.nlm.nih.gov/xmlrpc.php?rsd" />
<link rel="canonical" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/" />
<link rel='shortlink' href='https://wp.me/p3xcDk-5vb' />
<link rel="alternate" title="oEmbed (JSON)" type="application/json+oembed" href="https://circulatingnow.nlm.nih.gov/wp-json/oembed/1.0/embed?url=https%3A%2F%2Fcirculatingnow.nlm.nih.gov%2F2021%2F05%2F13%2Fexploring-the-data-of-web-archives-as-part-of-data-science-nlm%2F" />
<link rel="alternate" title="oEmbed (XML)" type="text/xml+oembed" href="https://circulatingnow.nlm.nih.gov/wp-json/oembed/1.0/embed?url=https%3A%2F%2Fcirculatingnow.nlm.nih.gov%2F2021%2F05%2F13%2Fexploring-the-data-of-web-archives-as-part-of-data-science-nlm%2F&#038;format=xml" />
<meta http-equiv="X-UA-Compatible" content="IE=edge"><script async type="text/javascript" id="_fed_an_ua_tag" src="https://dap.digitalgov.gov/Universal-Federated-Analytics-Min.js?agency=HHS&subagency=NIH&sp=query&enhlink=true"></script> <style>img#wpstats{display:none}</style>
<meta name="description" content="Over the past year our project was to gain practical experience with tools and techniques for the study of web archives data." />
<link rel="amphtml" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/amp/">
<!-- Jetpack Open Graph Tags -->
<meta property="og:type" content="article" />
<meta property="og:title" content="Exploring the Data of Web Archives as Part of Data Science @ NLM" />
<meta property="og:url" content="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/" />
<meta property="og:description" content="Over the past year our project was to gain practical experience with tools and techniques for the study of web archives data." />
<meta property="article:published_time" content="2021-05-13T15:30:44+00:00" />
<meta property="article:modified_time" content="2024-10-09T16:49:14+00:00" />
<meta property="og:site_name" content="Circulating Now from the NLM Historical Collections" />
<meta property="og:image" content="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?fit=900%2C400&#038;ssl=1" />
<meta property="og:image:width" content="900" />
<meta property="og:image:height" content="400" />
<meta property="og:image:alt" content="A network of nodes and edges showing the domains and links between them for the NLM Domestic Violence Awareness and Prevention web archive collection." />
<meta property="og:locale" content="en_US" />
<meta name="twitter:site" content="@NLM_NIH" />
<meta name="twitter:text:title" content="Exploring the Data of Web Archives as Part of Data Science @ NLM" />
<meta name="twitter:image" content="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?fit=900%2C400&#038;ssl=1&#038;w=640" />
<meta name="twitter:image:alt" content="A network of nodes and edges showing the domains and links between them for the NLM Domestic Violence Awareness and Prevention web archive collection." />
<meta name="twitter:card" content="summary_large_image" />
<!-- End Jetpack Open Graph Tags -->
<link rel="icon" href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2017/04/circulating-now-512.gif?fit=32%2C32&#038;ssl=1" sizes="32x32" />
<link rel="icon" href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2017/04/circulating-now-512.gif?fit=192%2C192&#038;ssl=1" sizes="192x192" />
<link rel="apple-touch-icon" href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2017/04/circulating-now-512.gif?fit=180%2C180&#038;ssl=1" />
<meta name="msapplication-TileImage" content="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2017/04/circulating-now-512.gif?fit=270%2C270&#038;ssl=1" />
<link rel="stylesheet" type="text/css" id="wp-custom-css" href="https://circulatingnow.nlm.nih.gov/?custom-css=715865f38f" /><!-- Jetpack Google Analytics -->
<script type='text/javascript'>
// Legacy Google Analytics (ga.js) bootstrap: queue the account and page-view
// commands on the global _gaq array, then inject the ga.js loader script.
var _gaq = _gaq || [];
_gaq.push(['_setAccount', 'UA-77373749-1']);
_gaq.push(['_trackPageview']);
(function() {
  var tracker = document.createElement('script');
  tracker.type = 'text/javascript';
  tracker.async = true;

  // Pick the host prefix that matches the protocol the page was loaded over.
  var hostPrefix;
  if ('https:' === document.location.protocol) {
    hostPrefix = 'https://ssl';
  } else {
    hostPrefix = 'http://www';
  }
  tracker.src = hostPrefix + '.google-analytics.com/ga.js';

  // Insert the loader ahead of the first <script> element in the document.
  var firstScript = document.getElementsByTagName('script')[0];
  firstScript.parentNode.insertBefore(tracker, firstScript);
})();
</script>
<!-- End Jetpack Google Analytics -->
</head>
<body class="post-template-default single single-post postid-21153 single-format-standard wp-custom-logo wp-embed-responsive post-layout-two-columns post-layout-columns">
<div id="page" class="hfeed site">
<a class="skip-link screen-reader-text" href="#content">Skip to content</a>
<header id="masthead" class="site-header clearfix" role="banner">
<div class="header-main container clearfix">
<div id="logo" class="site-branding clearfix">
<a href="https://circulatingnow.nlm.nih.gov/" class="custom-logo-link" rel="home"><img width="507" height="131" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?fit=507%2C131&amp;ssl=1" class="custom-logo" alt="Circulating Now From the Historical Collections of the National Library of Medicine, NIH" decoding="async" fetchpriority="high" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?w=507&amp;ssl=1 507w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?resize=300%2C78&amp;ssl=1 300w" sizes="(max-width: 507px) 100vw, 507px" data-attachment-id="22721" data-permalink="https://circulatingnow.nlm.nih.gov/circulating-nih-logo-v3-2/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?fit=507%2C131&amp;ssl=1" data-orig-size="507,131" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="circulating-nih-logo-v3" data-image-description="" data-image-caption="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?fit=300%2C78&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/11/circulating-nih-logo-v3.png?fit=507%2C131&amp;ssl=1" /></a>
<p class="site-title"><a href="https://circulatingnow.nlm.nih.gov/" rel="home">Circulating Now from the NLM Historical Collections</a></p>
</div><!-- .site-branding -->
<div class="header-widgets clearfix">
</div><!-- .header-widgets -->
</div><!-- .header-main -->
<div id="main-navigation-wrap" class="primary-navigation-wrap">
<div class="primary-navigation-container container">
<button class="primary-menu-toggle menu-toggle" aria-controls="primary-menu" aria-expanded="false" >
<svg class="icon icon-menu" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#menu"></use> </svg><svg class="icon icon-close" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#close"></use> </svg> <span class="menu-toggle-text">Menu</span>
</button>
<div class="primary-navigation">
<nav id="site-navigation" class="main-navigation" role="navigation" aria-label="Primary Menu">
<ul id="primary-menu" class="menu"><li id="menu-item-250" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-home menu-item-250"><a href="https://circulatingnow.nlm.nih.gov/">Blog</a></li>
<li id="menu-item-256" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-256"><a href="https://circulatingnow.nlm.nih.gov/about/">About</a></li>
<li id="menu-item-10880" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-10880"><a href="https://circulatingnow.nlm.nih.gov/comments-privacy/">COMMENTS &#038; PRIVACY</a></li>
<li id="menu-item-10881" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-10881"><a href="https://www.nlm.nih.gov/hmd" title="The History of Medicine Division">National Library of Medicine</a></li>
</ul> </nav><!-- #site-navigation -->
</div><!-- .primary-navigation -->
</div>
</div>
</header><!-- #masthead -->
<div id="content" class="site-content container clearfix">
<section id="primary" class="content-single content-area">
<main id="main" class="site-main" role="main">
<article id="post-21153" class="post-21153 post type-post status-publish format-standard has-post-thumbnail hentry category-collections category-revealing-data tag-about-us tag-data tag-digital-humanities tag-research tag-research-tools tag-web-collecting">
<img width="600" height="280" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?resize=600%2C280&amp;ssl=1" class="attachment-post-thumbnail size-post-thumbnail wp-post-image" alt="A network of nodes and edges showing the domains and links between them for the NLM Domestic Violence Awareness and Prevention web archive collection." decoding="async" data-attachment-id="21177" data-permalink="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/gephi_zoom_feature/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?fit=900%2C400&amp;ssl=1" data-orig-size="900,400" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Gephi_zoom_feature" data-image-description="" data-image-caption="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?fit=300%2C133&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom_feature.jpg?fit=840%2C373&amp;ssl=1" />
<header class="entry-header">
<h1 class="entry-title">Exploring the Data of Web Archives as Part of Data Science @ NLM</h1>
<div class="entry-meta"><span class="meta-date"><svg class="icon icon-standard" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#standard"></use> </svg><a href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/" title="11:30 AM" rel="bookmark"><time class="entry-date published updated" datetime="2021-05-13T11:30:44-04:00">May 13, 2021</time></a></span><span class="meta-author"> <svg class="icon icon-user" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#user"></use> </svg><span class="author vcard"><a class="url fn n" href="https://circulatingnow.nlm.nih.gov/author/moffattc/" title="View all posts by Circulating Now" rel="author">Circulating Now</a></span></span><span class="meta-category"> <svg class="icon icon-category" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#category"></use> </svg><a href="https://circulatingnow.nlm.nih.gov/category/collections/" rel="category tag">Collections</a>, <a href="https://circulatingnow.nlm.nih.gov/category/series/revealing-data/" rel="category tag">Revealing Data</a></span><span class="meta-comments"> <svg class="icon icon-edit" aria-hidden="true" role="img"> <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#edit"></use> </svg><a href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/#comments">2 comments</a></span></div>
</header><!-- .entry-header -->
<div class="entry-content clearfix">
<p><em>By Christie Moffatt ~</em></p>
<p>Over the past year (May 2020&#8211;May 2021) I participated in a National Library of Medicine (NLM) Data Science Mentorship program, which is part of a broader <a href="https://nlmdirector.nlm.nih.gov/2021/04/28/data-science-nlm-journey-continues-and-what-we-have-learned/">Data Science @ NLM</a> training program designed to prepare staff to engage with and participate in the Library&#8217;s developing data science efforts. My mentor was NLM Computer Scientist Marie Gallagher, and our project was to gain a better understanding of and practical experience with tools and techniques for the exploration and study of the data of web archives.</p>
<p>NLM has been actively involved in building <a href="https://archive-it.org/organizations/350">collections of web archives</a> through the work of our Web Collecting and Archiving Group.  A team of archivists, librarians, and historians is primarily using <a href="https://archive-it.org/" target="_blank" rel="noopener">Archive-It</a>, a service of the Internet Archive, to collect on a broad range of topics in line with NLM collection development policies, including <a href="https://circulatingnow.nlm.nih.gov/2017/12/01/archiving-hiv-aids-on-the-web/">HIV/AIDS</a>, the <a href="https://circulatingnow.nlm.nih.gov/2018/09/27/the-opioid-epidemic-collecting-now-for-future-research/">Opioid Epidemic</a>, the <a href="https://circulatingnow.nlm.nih.gov/2014/11/19/future-historical-collections-archiving-the-2014-ebola-outbreak/">2014 Ebola Outbreak</a>, and currently around the <a href="https://circulatingnow.nlm.nih.gov/2021/01/28/covid-19-web-collecting-reflections-at-one-year/">COVID-19 Pandemic</a>.   As a member of this working group, I was interested to learn more about tools such as <a href="https://archivesunleashed.org/" target="_blank" rel="noopener">Archives Unleashed</a> and the <a href="https://glam-workbench.net/web-archives/" target="_blank" rel="noopener">GLAM Workbench</a> to better understand the work and needs of researchers, as well as explore the possibility of using these tools to support ongoing collection development and curation.   I had participated in an Archives Unleashed <a href="https://archivesunleashed.org/events/">datathon</a> in 2019, and recognized that I needed much more hands-on experience to better understand the nature of the tools, how to use them, and the broader picture of web archives data and research.  
The NLM Data Science Mentorship program provided a wonderful opportunity to collaborate and learn more about the data of web archives, as well as project design, experimental thinking, science communication, and data storytelling.</p>
<p>The Archives Unleashed project, supported by The Andrew W. Mellon Foundation, provides a set of tools designed to lower barriers for researchers to explore web archives.  The <a href="https://archivesunleashed.org/getting-started/" target="_blank" rel="noopener">Archives Unleashed tools</a> are designed for different levels of experience including the Archives Unleashed Cloud (for beginners), Archives Unleashed Notebooks (for beginner/intermediate users), and Archives Unleashed Toolkit (for advanced users).  My mentor and I reviewed each of these tools and focused on the <a href="https://archivesunleashed.org/cloud/">Archives Unleashed Cloud</a> (migrating soon to Archive-It) to query the data of individual NLM web archive collections and obtain derivative data files for further analysis.</p>
<p>We uploaded the resulting derivative data files into a variety of data visualization and text analysis tools and learned a number of lessons on the value of a flexible computer environment to install programs and software, the need for advanced data cleaning skills, and generally, the need for patience and flexibility.  I also gained an appreciation for the complexity of the analysis tools and the need for more time to understand how the data is interpreted and presented.</p>
<p>In one experiment, following learning guides from Archives Unleashed, we loaded one of the derivative files (the <a href="https://gexf.net/">GEXF</a> file) into an open source graph visualization program called <a href="https://gephi.org/">Gephi</a> to create a visualization of the network of nodes (domains) and edges (hyperlinks between them) for a small <a href="https://archive-it.org/collections/8370">collection</a> of sites related to the NLM exhibition <em><a href="https://www.nlm.nih.gov/exhibition/confrontingviolence/index.html">Confronting Violence, Improving Women&#8217;s Lives</a></em>.</p>
<div class="tiled-gallery type-rectangular tiled-gallery-unresized" data-original-width="840" data-carousel-extra='{&quot;blog_id&quot;:1,&quot;permalink&quot;:&quot;https:\/\/circulatingnow.nlm.nih.gov\/2021\/05\/13\/exploring-the-data-of-web-archives-as-part-of-data-science-nlm\/&quot;,&quot;likes_blog_id&quot;:&quot;52242398&quot;}' itemscope itemtype="http://schema.org/ImageGallery" > <div class="gallery-row" style="width: 840px; height: 196px;" data-original-width="840" data-original-height="196" > <div class="gallery-group images-1" style="width: 285px; height: 196px;" data-original-width="285" data-original-height="196" > <div class="tiled-gallery-item tiled-gallery-item-large" itemprop="associatedMedia" itemscope itemtype="http://schema.org/ImageObject"> <a href="https://circulatingnow.nlm.nih.gov/gephi_fullcollection/" border="0" itemprop="url"> <meta itemprop="width" content="281"> <meta itemprop="height" content="192"> <img decoding="async" class="" data-attachment-id="21113" data-orig-file="https://circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg" data-orig-size="1124,769" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Full Gephi Visualization" data-image-description="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?fit=300%2C205&#038;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?fit=840%2C575&#038;ssl=1" 
src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?w=281&#038;h=192&#038;ssl=1" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?w=1124&amp;ssl=1 1124w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?resize=300%2C205&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?resize=1024%2C701&amp;ssl=1 1024w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?resize=768%2C525&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_fullCollection.jpg?resize=840%2C575&amp;ssl=1 840w" width="281" height="192" loading="lazy" data-original-width="281" data-original-height="192" itemprop="http://schema.org/image" title="Full Gephi Visualization" alt="A large network of web domains (nodes) and hyperlinks between them (edges) in various colors." style="width: 281px; height: 192px;" /> </a> <div class="tiled-gallery-caption" itemprop="caption description"> Graphic visualization in Gephi, of network connections between domains in an NLM web archive collection related to NLM exhibition Confronting Violence, Improving Women&#8217;s Lives. 
</div> </div> </div> <!-- close group --> <div class="gallery-group images-1" style="width: 277px; height: 196px;" data-original-width="277" data-original-height="196" > <div class="tiled-gallery-item tiled-gallery-item-large" itemprop="associatedMedia" itemscope itemtype="http://schema.org/ImageObject"> <a href="https://circulatingnow.nlm.nih.gov/gephi_zoom2/" border="0" itemprop="url"> <meta itemprop="width" content="273"> <meta itemprop="height" content="192"> <img decoding="async" class="" data-attachment-id="21114" data-orig-file="https://circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg" data-orig-size="1139,801" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Close-up of Major Nodes" data-image-description="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?fit=300%2C211&#038;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?fit=840%2C591&#038;ssl=1" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?w=273&#038;h=192&#038;ssl=1" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?w=1139&amp;ssl=1 1139w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?resize=300%2C211&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?resize=1024%2C720&amp;ssl=1 1024w, 
https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?resize=768%2C540&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_Zoom2.jpg?resize=840%2C591&amp;ssl=1 840w" width="273" height="192" loading="lazy" data-original-width="273" data-original-height="192" itemprop="http://schema.org/image" title="Close-up of Major Nodes" alt="A large network of web domains (nodes) and hyperlinks between them (edges) in various colors." style="width: 273px; height: 192px;" /> </a> <div class="tiled-gallery-caption" itemprop="caption description"> Graphic visualization in Gephi, of network connections between domains in an NLM web archive collection related to NLM exhibition Confronting Violence, Improving Women&#8217;s Lives. </div> </div> </div> <!-- close group --> <div class="gallery-group images-1" style="width: 278px; height: 196px;" data-original-width="278" data-original-height="196" > <div class="tiled-gallery-item tiled-gallery-item-large" itemprop="associatedMedia" itemscope itemtype="http://schema.org/ImageObject"> <a href="https://circulatingnow.nlm.nih.gov/gephi_zoom3/" border="0" itemprop="url"> <meta itemprop="width" content="274"> <meta itemprop="height" content="192"> <img decoding="async" class="" data-attachment-id="21115" data-orig-file="https://circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg" data-orig-size="1188,831" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Detail of Edges Around forensicnurses.org" data-image-description="" 
data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?fit=300%2C210&#038;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?fit=840%2C587&#038;ssl=1" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?w=274&#038;h=192&#038;ssl=1" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?w=1188&amp;ssl=1 1188w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?resize=300%2C210&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?resize=1024%2C716&amp;ssl=1 1024w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?resize=768%2C537&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Gephi_zoom3.jpg?resize=840%2C588&amp;ssl=1 840w" width="274" height="192" loading="lazy" data-original-width="274" data-original-height="192" itemprop="http://schema.org/image" title="Detail of Edges Around forensicnurses.org" alt="A large network of web domains (nodes) and hyperlinks between them (edges) in various colors." style="width: 274px; height: 192px;" /> </a> <div class="tiled-gallery-caption" itemprop="caption description"> Graphic visualization in Gephi, of network connections between domains in an NLM web archive collection related to NLM exhibition Confronting Violence, Improving Women&#8217;s Lives. </div> </div> </div> <!-- close group --> </div> <!-- close row --> </div>
<figure id="attachment_11953" class="wp-caption aligncenter"><figcaption class="wp-caption-text" style="width: 800px;">Graphic visualization in Gephi, of network connections between domains in an NLM web archive collection related to NLM exhibition <em>Confronting Violence, Improving Women&#8217;s Lives.</em></figcaption></figure>
<p>If we look closely, we can see that there are arrows between the domains, indicating hyperlink connections.  The size of the labels and nodes is significant, representing how many times the source is linked to. Researchers can use this visualization to see who is linking to whom, and the most popular domains in the collection.  In this case, we found that forensicnurses.org, Twitter, Facebook, and YouTube are domains frequently linked to in the collection. We can look specifically at forensicnurses.org and focus attention on the links to and from this particular domain, with <span data-ccp-charstyle="Hyperlink">safeta.org</span><span data-contrast="auto">, then </span><span data-ccp-charstyle="Hyperlink">community.iafn.org,</span> having the largest number of links.</p>
<p>In another experiment we used a derivative file containing the text extracted from HTML documents within the web archive (a CSV file).  We explored this data using a web-based set of text analysis tools called <a href="https://voyant-tools.org/" target="_blank" rel="noopener">Voyant Tools</a>.   Data cleanup of the text in our larger collections proved challenging, and we ended up creating a very small sample data set for this project. The text was still a challenge with unrecognizable characters, though a bit easier to manage. We removed content in languages other than English or Spanish (which made sense for this data set), and removed file formats that were not text. You can see a big difference in the visualizations using the “before” and “after” versions of the derivative text file.</p>
<div class="tiled-gallery type-rectangular tiled-gallery-unresized" data-original-width="840" data-carousel-extra='{&quot;blog_id&quot;:1,&quot;permalink&quot;:&quot;https:\/\/circulatingnow.nlm.nih.gov\/2021\/05\/13\/exploring-the-data-of-web-archives-as-part-of-data-science-nlm\/&quot;,&quot;likes_blog_id&quot;:&quot;52242398&quot;}' itemscope itemtype="http://schema.org/ImageGallery" > <div class="gallery-row" style="width: 840px; height: 209px;" data-original-width="840" data-original-height="209" > <div class="gallery-group images-1" style="width: 420px; height: 209px;" data-original-width="420" data-original-height="209" > <div class="tiled-gallery-item tiled-gallery-item-large" itemprop="associatedMedia" itemscope itemtype="http://schema.org/ImageObject"> <a href="https://circulatingnow.nlm.nih.gov/voyant1/" border="0" itemprop="url"> <meta itemprop="width" content="416"> <meta itemprop="height" content="205"> <img decoding="async" class="" data-attachment-id="21119" data-orig-file="https://circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg" data-orig-size="1655,814" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Before" data-image-description="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?fit=300%2C148&#038;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?fit=840%2C413&#038;ssl=1" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?w=416&#038;h=205&#038;ssl=1" 
srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?w=1655&amp;ssl=1 1655w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=300%2C148&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=1024%2C504&amp;ssl=1 1024w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=768%2C378&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=1536%2C755&amp;ssl=1 1536w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=1200%2C590&amp;ssl=1 1200w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant1.jpg?resize=840%2C413&amp;ssl=1 840w" width="416" height="205" loading="lazy" data-original-width="416" data-original-height="205" itemprop="http://schema.org/image" title="Before" alt="A screenshot of a dashboard showing unmeaningful displays of information." style="width: 416px; height: 205px;" /> </a> <div class="tiled-gallery-caption" itemprop="caption description"> A Voyant display of data before it has been cleaned. 
</div> </div> </div> <!-- close group --> <div class="gallery-group images-1" style="width: 420px; height: 209px;" data-original-width="420" data-original-height="209" > <div class="tiled-gallery-item tiled-gallery-item-large" itemprop="associatedMedia" itemscope itemtype="http://schema.org/ImageObject"> <a href="https://circulatingnow.nlm.nih.gov/voyant2/" border="0" itemprop="url"> <meta itemprop="width" content="416"> <meta itemprop="height" content="205"> <img decoding="async" class="" data-attachment-id="21120" data-orig-file="https://circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg" data-orig-size="1655,814" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="After" data-image-description="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?fit=300%2C148&#038;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?fit=840%2C413&#038;ssl=1" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?w=416&#038;h=205&#038;ssl=1" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?w=1655&amp;ssl=1 1655w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=300%2C148&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=1024%2C504&amp;ssl=1 1024w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=768%2C378&amp;ssl=1 768w, 
https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=1536%2C755&amp;ssl=1 1536w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=1200%2C590&amp;ssl=1 1200w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/Voyant2.jpg?resize=840%2C413&amp;ssl=1 840w" width="416" height="205" loading="lazy" data-original-width="416" data-original-height="205" itemprop="http://schema.org/image" title="After" alt="A program dashboard displaying a wordcloud, text associations, graph and frequency data drawn from a text analysis" style="width: 416px; height: 205px;" /> </a> <div class="tiled-gallery-caption" itemprop="caption description"> A Voyant display using cleaned data. </div> </div> </div> <!-- close group --> </div> <!-- close row --> </div>
<figure id="attachment_11953" class="wp-caption aligncenter"><figcaption class="wp-caption-text" style="width: 800px;">A &#8220;before&#8221; and &#8220;after&#8221; data cleaning text visualization in Voyant, using data from a test NLM web archive collection related to HHS efforts to address hesitancy around COVID-19 vaccines.</figcaption></figure>
<p>With Voyant Tools researchers can visualize the text in multiple ways: a word cloud showing the most frequent words used in the collection, the context of the word or words used in a collection (for example, what text comes before or after the word “vaccine”), where in the text the terms of interest are most concentrated, and the terms highlighted in the text itself.  There are all kinds of ways to filter this data, and researchers can swap out the visualizations (there are 28 available) depending on what is most useful to their research.</p>
<p>We also tested out a set of Jupyter notebooks, released in 2020 as part of the <a href="https://glam-workbench.net/web-archives/" target="_blank" rel="noopener">GLAM Workbench</a> (Galleries, Libraries, Archives, and Museums) with funding from the <a href="https://netpreserve.org/">International Internet Preservation Consortium (IIPC)</a>. Like Archives Unleashed Cloud, the notebooks (there are 16) are intended to be a starting point specifically for researchers who want to make use of web archives.  The notebooks offer a range of options for examining content in the Internet Archive (and other archives); and—even easier on the researcher—run using <a href="https://jupyter.org/binder" target="_blank" rel="noopener">Binder</a>, a virtual machine that you don&#8217;t need any software installed on your own computer to use.</p>
<p>Researchers can use a notebook, &#8220;<a href="https://glam-workbench.net/web-archives/#create-and-compare-full-page-screenshots-from-archived-web-pages" target="_blank" rel="noopener">Get full page screenshots from archived web pages</a>,&#8221; for example, to examine visual changes in a website over time.  In the visual below, we reviewed the CDC coronavirus homepage as it changed throughout 2020.</p>
<figure id="attachment_21118" aria-describedby="caption-attachment-21118" style="width: 996px" class="wp-caption aligncenter"><a href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?ssl=1"><img data-recalc-dims="1" decoding="async" data-attachment-id="21118" data-permalink="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/glamworkbench_getfullpagescreenshots/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?fit=996%2C820&amp;ssl=1" data-orig-size="996,820" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="GLAMWorkbench_GetFullPageScreenshots" data-image-description="" data-image-caption="&lt;p&gt;A GLAM Workbench tool displaying archives of a webpage on three different dates.&lt;/p&gt;
" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?fit=300%2C247&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?fit=840%2C692&amp;ssl=1" class="wp-image-21118 size-full" title="CDC Page on COVID-19 in January, February, and March of 2020" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?resize=840%2C692&#038;ssl=1" alt="A display of three versions of a CDC webpage from January, February and March of 2020 showing how it got longer and more complex." width="840" height="692" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?w=996&amp;ssl=1 996w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?resize=300%2C247&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?resize=768%2C632&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_GetFullPageScreenshots.jpg?resize=840%2C692&amp;ssl=1 840w" sizes="(max-width: 840px) 100vw, 840px" /></a><figcaption id="caption-attachment-21118" class="wp-caption-text">Screenshot of the target URL <a href="https://www.cdc.gov/coronavirus/2019-ncov/" rel="nofollow">https://www.cdc.gov/coronavirus/2019-ncov/</a> over time using &#8220;Get full page screenshots from archived web pages&#8221; GLAM Workbench notebook.</figcaption></figure>
<p>Other notebooks in the collection allow researchers to discover changes to text on a webpage over time, for example, or to discover when a piece of text first appears in an archived webpage. In the example below, we used the notebook &#8220;<a href="https://glam-workbench.net/web-archives/#find-when-a-piece-of-text-appears-in-an-archived-web-page" target="_blank" rel="noopener">Find when a piece of text appears in an archived web page</a>&#8221; to discover the first time “social distancing” was used on the CDC coronavirus homepage.</p>
<figure id="attachment_21117" aria-describedby="caption-attachment-21117" style="width: 970px" class="wp-caption aligncenter"><a href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?ssl=1"><img data-recalc-dims="1" decoding="async" data-attachment-id="21117" data-permalink="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/glamworkbench_findwhenapieceoftextappears/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?fit=970%2C800&amp;ssl=1" data-orig-size="970,800" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="GLAMWorkbench_FindWhenAPieceOfTextAppears" data-image-description="" data-image-caption="&lt;p&gt;A GLAM Workbench tool displaying the first use of &#8220;social distancing&#8221; on a cdc webpage on June 15, 2020.&lt;/p&gt;
" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?fit=300%2C247&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?fit=840%2C693&amp;ssl=1" class="wp-image-21117 size-full" title="&quot;Social Distancing&quot; first appeared on the CDC coronavirus homepage on June 15, 2020" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?resize=840%2C693&#038;ssl=1" alt="A screenshot of a tool that locates specific phrases in webpage text across time." width="840" height="693" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?w=970&amp;ssl=1 970w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?resize=300%2C247&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?resize=768%2C633&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/GLAMWorkbench_FindWhenAPieceOfTextAppears.jpg?resize=840%2C693&amp;ssl=1 840w" sizes="(max-width: 840px) 100vw, 840px" /></a><figcaption id="caption-attachment-21117" class="wp-caption-text">Screenshot of results from searching for First Occurrence of the text &#8220;Social Distancing&#8221; on <a href="https://www.cdc.gov/coronavirus/2019-ncov/" rel="nofollow">https://www.cdc.gov/coronavirus/2019-ncov/</a> using &#8220;Find when a piece of text appears in an archived web page&#8221; GLAM Workbench notebook.</figcaption></figure>
<p>These notebooks are not without challenges themselves.  While really easy to use, it takes time to query the entire Internet Archive for results (sometimes hours) and the notebooks can time out.  This work provided the opportunity to compare approaches to querying the data of web archives, as well as more lessons on patience and persistence.</p>
<p>The work we started during this mentorship is ongoing and the landscape of tools is evolving.  There is definitely more room for further exploration of analysis tools to better understand how researchers can use web archives and how web collecting organizations like NLM can support their work. We learned midway through the project that Archives Unleashed Cloud will be decommissioned at the end of June 2021 and migrated to Archive-It.  I look forward to learning more about what opportunities this will bring for making NLM web archive collections available as data, whether through providing tidy derivative data sets for our researchers, or sharing notebooks querying the web archive data.  Supporting researchers through description and transparency about the scope of a collection is also important, as well as helping them understand the nature of web content as historical materials (on this topic I read, and consulted many times throughout this project, Ian Milligan&#8217;s <a href="https://www.ianmilligan.ca/publication/history-in-the-age-of-abundance/"><em>History in the Age of Abundance?  How the Web is Transforming Historical Research</em></a>). There is much exciting and important work possible ahead.</p>
<figure id="attachment_21182" aria-describedby="caption-attachment-21182" style="width: 350px" class="wp-caption alignright"><a href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?ssl=1"><img data-recalc-dims="1" loading="lazy" decoding="async" data-attachment-id="21182" data-permalink="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/nlmstaffnetwork/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?fit=1253%2C769&amp;ssl=1" data-orig-size="1253,769" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}" data-image-title="Thanks to NLM Staff" data-image-description="&lt;p&gt;Patti Brennan, Dianne Babski, Maryam Zaringhalam, Maria Collins, Peter Cooper, Mike Davidson, Lisa Federer, Anna Ripple, Nicole Sroka, Emma Write, LO Management, Jennifer Marill, HMD Management, Rebecca Warlow, Mentees, Mentors, LHNCBC Management, Rachel Tohn, Jim Mork, Marie Gallagher, OCCS Management&lt;/p&gt;
" data-image-caption="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?fit=300%2C184&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?fit=840%2C515&amp;ssl=1" class="wp-image-21182" title="Thank you NLM!" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=350%2C215&#038;ssl=1" alt="Network graphic naming NLM staff and offices that supported the project." width="350" height="215" longdesc="Patti Brennan, Dianne Babski, Maryam Zaringhalam, Maria Collins, Peter Cooper, Mike Davidson, Lisa Federer, Anna Ripple, Nicole Sroka, Emma Write, LO Management, Jennifer Marill, HMD Management, Rebecca Warlow, Mentees, Mentors, LHNCBC Management, Rachel Tohn, Jim Mork, Marie Gallagher, OCCS Management" srcset="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=300%2C184&amp;ssl=1 300w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=1024%2C628&amp;ssl=1 1024w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=768%2C471&amp;ssl=1 768w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=1200%2C736&amp;ssl=1 1200w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?resize=840%2C516&amp;ssl=1 840w, https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2021/05/NLMstaffnetwork.jpg?w=1253&amp;ssl=1 1253w" sizes="auto, (max-width: 350px) 100vw, 350px" /></a><figcaption id="caption-attachment-21182" class="wp-caption-text">Thanks to everyone across NLM for support on this project!</figcaption></figure>
<p>I&#8217;m grateful for this opportunity to work with a mentor to explore and learn about the bigger picture of working with web archives as data over this past year.  Many, many thanks to Marie Gallagher, the entire Data Science @ NLM training program team, and all those at NLM supporting this work.</p>
<p><em><a href="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2018/05/christie-moffatt.jpg?ssl=1"><img data-recalc-dims="1" loading="lazy" decoding="async" data-attachment-id="14591" data-permalink="https://circulatingnow.nlm.nih.gov/2019/10/15/nlms-profiles-in-science-exploring-the-stories-of-scientific-discovery/nlm-staff-head-shots/" data-orig-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2018/05/christie-moffatt.jpg?fit=800%2C1200&amp;ssl=1" data-orig-size="800,1200" data-comments-opened="1" data-image-meta="{&quot;aperture&quot;:&quot;3.5&quot;,&quot;credit&quot;:&quot;Chia-Chi \&quot;Charlie\&quot; Chang 703-431&quot;,&quot;camera&quot;:&quot;Canon EOS 5D Mark IV&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;1525258458&quot;,&quot;copyright&quot;:&quot;www.ImageCaffeine.com&quot;,&quot;focal_length&quot;:&quot;100&quot;,&quot;iso&quot;:&quot;800&quot;,&quot;shutter_speed&quot;:&quot;0.00625&quot;,&quot;title&quot;:&quot;NLM Staff Head Shots&quot;,&quot;orientation&quot;:&quot;1&quot;}" data-image-title="Christie Moffatt" data-image-description="" data-image-caption="" data-medium-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2018/05/christie-moffatt.jpg?fit=200%2C300&amp;ssl=1" data-large-file="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2018/05/christie-moffatt.jpg?fit=683%2C1024&amp;ssl=1" class="alignleft wp-image-14591" src="https://i0.wp.com/circulatingnow.nlm.nih.gov/wp-content/uploads/2018/05/christie-moffatt.jpg?resize=67%2C100&#038;ssl=1" alt="An informal portrait of Christie Moffatt." width="67" height="100" /></a>Christie Moffatt is Manager of the Digital Manuscripts Program in the History of Medicine Division at the National Library of Medicine and Chair of NLM&#8217;s Web Collecting and Archiving Working Group.</em></p>
<div class="sharedaddy sd-sharing-enabled"><div class="robots-nocontent sd-block sd-social sd-social-icon sd-sharing"><h3 class="sd-title">Circulate this:</h3><div class="sd-content"><ul><li class="share-twitter"><a rel="nofollow noopener noreferrer" data-shared="sharing-twitter-21153" class="share-twitter sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=twitter" target="_blank" title="Click to share on Twitter" ><span></span><span class="sharing-screen-reader-text">Click to share on Twitter (Opens in new window)</span></a></li><li class="share-facebook"><a rel="nofollow noopener noreferrer" data-shared="sharing-facebook-21153" class="share-facebook sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=facebook" target="_blank" title="Click to share on Facebook" ><span></span><span class="sharing-screen-reader-text">Click to share on Facebook (Opens in new window)</span></a></li><li class="share-pinterest"><a rel="nofollow noopener noreferrer" data-shared="sharing-pinterest-21153" class="share-pinterest sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=pinterest" target="_blank" title="Click to share on Pinterest" ><span></span><span class="sharing-screen-reader-text">Click to share on Pinterest (Opens in new window)</span></a></li><li class="share-tumblr"><a rel="nofollow noopener noreferrer" data-shared="" class="share-tumblr sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=tumblr" target="_blank" title="Click to share on Tumblr" ><span></span><span class="sharing-screen-reader-text">Click to share on Tumblr (Opens in new window)</span></a></li><li 
class="share-reddit"><a rel="nofollow noopener noreferrer" data-shared="" class="share-reddit sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=reddit" target="_blank" title="Click to share on Reddit" ><span></span><span class="sharing-screen-reader-text">Click to share on Reddit (Opens in new window)</span></a></li><li class="share-linkedin"><a rel="nofollow noopener noreferrer" data-shared="sharing-linkedin-21153" class="share-linkedin sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=linkedin" target="_blank" title="Click to share on LinkedIn" ><span></span><span class="sharing-screen-reader-text">Click to share on LinkedIn (Opens in new window)</span></a></li><li class="share-email"><a rel="nofollow noopener noreferrer" data-shared="" class="share-email sd-button share-icon no-text" href="mailto:?subject=%5BShared%20Post%5D%20Exploring%20the%20Data%20of%20Web%20Archives%20as%20Part%20of%20Data%20Science%20%40%20NLM&body=https%3A%2F%2Fcirculatingnow.nlm.nih.gov%2F2021%2F05%2F13%2Fexploring-the-data-of-web-archives-as-part-of-data-science-nlm%2F&share=email" target="_blank" title="Click to email a link to a friend" data-email-share-error-title="Do you have email set up?" data-email-share-error-text="If you&#039;re having problems sharing via email, you might not have email set up for your browser. You may need to create a new email yourself." 
data-email-share-nonce="ab4d12bb55" data-email-share-track-url="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=email"><span></span><span class="sharing-screen-reader-text">Click to email a link to a friend (Opens in new window)</span></a></li><li><a href="#" class="sharing-anchor sd-button share-more"><span>More</span></a></li><li class="share-end"></li></ul><div class="sharing-hidden"><div class="inner" style="display: none;"><ul><li class="share-print"><a rel="nofollow noopener noreferrer" data-shared="" class="share-print sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/#print" target="_blank" title="Click to print" ><span></span><span class="sharing-screen-reader-text">Click to print (Opens in new window)</span></a></li><li class="share-jetpack-whatsapp"><a rel="nofollow noopener noreferrer" data-shared="" class="share-jetpack-whatsapp sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=jetpack-whatsapp" target="_blank" title="Click to share on WhatsApp" ><span></span><span class="sharing-screen-reader-text">Click to share on WhatsApp (Opens in new window)</span></a></li><li class="share-pocket"><a rel="nofollow noopener noreferrer" data-shared="" class="share-pocket sd-button share-icon no-text" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=pocket" target="_blank" title="Click to share on Pocket" ><span></span><span class="sharing-screen-reader-text">Click to share on Pocket (Opens in new window)</span></a></li><li class="share-telegram"><a rel="nofollow noopener noreferrer" data-shared="" class="share-telegram sd-button share-icon no-text" 
href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?share=telegram" target="_blank" title="Click to share on Telegram" ><span></span><span class="sharing-screen-reader-text">Click to share on Telegram (Opens in new window)</span></a></li><li class="share-end"></li></ul></div></div></div></div></div><div class='sharedaddy sd-block sd-like jetpack-likes-widget-wrapper jetpack-likes-widget-unloaded' id='like-post-wrapper-52242398-21153-67c7ac579f22f' data-src='https://widgets.wp.com/likes/?ver=14.4#blog_id=52242398&amp;post_id=21153&amp;origin=circulatingnow.nlm.nih.gov&amp;obj_id=52242398-21153-67c7ac579f22f' data-name='like-post-frame-52242398-21153-67c7ac579f22f' data-title='Like or Reblog'><h3 class="sd-title">Like this:</h3><div class='likes-widget-placeholder post-likes-widget-placeholder' style='height: 55px;'><span class='button'><span>Like</span></span> <span class="loading">Loading...</span></div><span class='sd-text-color'></span><a class='sd-link-color'></a></div>
<div id='jp-relatedposts' class='jp-relatedposts' >
<h3 class="jp-relatedposts-headline"><em>Related</em></h3>
</div>
<div class="wp-block-group has-border-color" style="border-style:none;border-width:0px;margin-top:32px;margin-bottom:32px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px"><div class="wp-block-group__inner-container is-layout-flow wp-block-group-is-layout-flow">
<hr class="wp-block-separator has-alpha-channel-opacity is-style-wide" style="margin-bottom:24px"/>
<h3 class="wp-block-heading has-text-align-center" style="margin-top:4px;margin-bottom:10px">Discover more from Circulating Now from the NLM Historical Collections</h3>
<p class="has-text-align-center" style="margin-top:10px;margin-bottom:10px;font-size:15px">Subscribe to get the latest posts sent to your email.</p>
<div class="wp-block-group"><div class="wp-block-group__inner-container is-layout-constrained wp-container-core-group-is-layout-1 wp-block-group-is-layout-constrained">
<div class="wp-block-jetpack-subscriptions__supports-newline wp-block-jetpack-subscriptions">
<div class="wp-block-jetpack-subscriptions__container is-not-subscriber">
<form
action="https://wordpress.com/email-subscriptions"
method="post"
accept-charset="utf-8"
data-blog="52242398"
data-post_access_level="everybody"
data-subscriber_email=""
id="subscribe-blog"
>
<div class="wp-block-jetpack-subscriptions__form-elements">
<p id="subscribe-email">
<label
id="subscribe-field-label"
for="subscribe-field"
class="screen-reader-text"
>
Type your email… </label>
<input
required="required"
type="email"
name="email"
class="no-border-radius "
style="font-size: 16px;padding: 15px 23px 15px 23px;border-radius: 0px;border-width: 1px;"
placeholder="Type your email…"
value=""
id="subscribe-field"
title="Please fill in this field."
/> </p>
<p id="subscribe-submit"
>
<input type="hidden" name="action" value="subscribe"/>
<input type="hidden" name="blog_id" value="52242398"/>
<input type="hidden" name="source" value="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/"/>
<input type="hidden" name="sub-type" value="subscribe-block"/>
<input type="hidden" name="app_source" value="subscribe-block-post-end"/>
<input type="hidden" name="redirect_fragment" value="subscribe-blog"/>
<input type="hidden" name="lang" value="en_US"/>
<input type="hidden" id="_wpnonce" name="_wpnonce" value="d3fcec8ab9" /><input type="hidden" name="_wp_http_referer" value="/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/" /><input type="hidden" name="post_id" value="21153"/> <button type="submit"
class="wp-block-button__link no-border-radius"
style="font-size: 16px;padding: 15px 23px 15px 23px;margin: 0; margin-left: 10px;border-radius: 0px;border-width: 1px;"
name="jetpack_subscriptions_widget"
>
Subscribe </button>
</p>
</div>
</form>
</div>
</div>
</div></div>
</div></div>
</div><!-- .entry-content -->
<footer class="entry-footer">
<div class="entry-tags clearfix">
<span class="meta-tags">
<a href="https://circulatingnow.nlm.nih.gov/tag/about-us/" rel="tag">About Us</a><a href="https://circulatingnow.nlm.nih.gov/tag/data/" rel="tag">data</a><a href="https://circulatingnow.nlm.nih.gov/tag/digital-humanities/" rel="tag">digital humanities</a><a href="https://circulatingnow.nlm.nih.gov/tag/research/" rel="tag">research</a><a href="https://circulatingnow.nlm.nih.gov/tag/research-tools/" rel="tag">Research Tools</a><a href="https://circulatingnow.nlm.nih.gov/tag/web-collecting/" rel="tag">web collecting</a> </span>
</div><!-- .entry-tags -->
<nav class="navigation post-navigation" aria-label="Posts">
<h2 class="screen-reader-text">Post navigation</h2>
<div class="nav-links"><div class="nav-previous"><a href="https://circulatingnow.nlm.nih.gov/2021/05/06/an-articella-in-catalan-1475/" rel="prev"><span class="screen-reader-text">Previous Post:</span>An Articella in Catalan, 1475</a></div><div class="nav-next"><a href="https://circulatingnow.nlm.nih.gov/2021/05/20/nlm-collections-tour-mental-health/" rel="next"><span class="screen-reader-text">Next Post:</span>NLM Collection Tour: Mental Health</a></div></div>
</nav>
</footer><!-- .entry-footer -->
</article>
<div id="comments" class="comments-area">
<header class="comments-header">
<h2 class="comments-title">
2 comments </h2>
</header><!-- .comment-header -->
<ol class="comment-list">
<li id="comment-86079" class="comment even thread-even depth-1">
<article id="div-comment-86079" class="comment-body">
<footer class="comment-meta">
<div class="comment-author vcard">
<img alt='' src='https://secure.gravatar.com/avatar/c19b566d0dc4245aba204c976266d3db?s=56&#038;d=mm&#038;r=pg' srcset='https://secure.gravatar.com/avatar/c19b566d0dc4245aba204c976266d3db?s=112&#038;d=mm&#038;r=pg 2x' class='avatar avatar-56 photo' height='56' width='56' loading='lazy' decoding='async'/> <b class="fn">James</b> <span class="says">says:</span> </div><!-- .comment-author -->
<div class="comment-metadata">
<a href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/#comment-86079"><time datetime="2021-05-22T15:41:53-04:00">May 22, 2021 at 3:41 PM</time></a> </div><!-- .comment-metadata -->
</footer><!-- .comment-meta -->
<div class="comment-content">
<p>Very interesting. Great read, thanks.</p>
<div class='jetpack-comment-likes-widget-wrapper jetpack-likes-widget-unloaded' id='like-comment-wrapper-52242398-86079-67c7ac57a339e' data-src='https://widgets.wp.com/likes/#blog_id=52242398&amp;comment_id=86079&amp;origin=circulatingnow.nlm.nih.gov&amp;obj_id=52242398-86079-67c7ac57a339e' data-name='like-comment-frame-52242398-86079-67c7ac57a339e'>
<div class='likes-widget-placeholder comment-likes-widget-placeholder comment-likes'><span class='loading'>Loading...</span></div>
<div class='comment-likes-widget jetpack-likes-widget comment-likes'><span class='comment-like-feedback'></span><span class='sd-text-color'></span><a class='sd-link-color'></a></div>
</div>
</div><!-- .comment-content -->
<div class="reply"><a rel="nofollow" class="comment-reply-link" href="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/?replytocom=86079#respond" data-commentid="86079" data-postid="21153" data-belowelement="div-comment-86079" data-respondelement="respond" data-replyto="Reply to James" aria-label="Reply to James">Reply</a></div> </article><!-- .comment-body -->
</li><!-- #comment-## -->
<li id="comment-86102" class="pingback odd alt thread-odd thread-alt depth-1">
<div class="comment-body">
Pingback: <a href="https://archive-it.org/blog/post/archive-it-partner-news-july-2021/" class="url" rel="ugc external nofollow">Archive-It Blog &#8211; Archive-It Partner News, June 2021</a> </div>
</li><!-- #comment-## -->
</ol><!-- .comment-list -->
<div id="respond" class="comment-respond">
<h3 id="reply-title" class="comment-reply-title">Leave a Reply<small><a rel="nofollow" id="cancel-comment-reply-link" href="/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/#respond" style="display:none;">Cancel reply</a></small></h3> <form id="commentform" class="comment-form">
<iframe
title="Comment Form"
src="https://jetpack.wordpress.com/jetpack-comment/?blogid=52242398&#038;postid=21153&#038;comment_registration=0&#038;require_name_email=1&#038;stc_enabled=1&#038;stb_enabled=1&#038;show_avatars=1&#038;avatar_default=mystery&#038;greeting=Leave+a+Reply&#038;jetpack_comments_nonce=4133bf21a2&#038;greeting_reply=Leave+a+Reply+to+%25s&#038;color_scheme=light&#038;lang=en_US&#038;jetpack_version=14.4&#038;iframe_unique_id=1&#038;show_cookie_consent=10&#038;has_cookie_consent=0&#038;is_current_user_subscribed=0&#038;token_key=%3Bnormal%3B&#038;sig=27fa0197fd4ff48a5a4bf86ca6719080ea9d83df#parent=https%3A%2F%2Fcirculatingnow.nlm.nih.gov%2F2021%2F05%2F13%2Fexploring-the-data-of-web-archives-as-part-of-data-science-nlm%2F"
name="jetpack_remote_comment"
style="width:100%; height: 430px; border:0;"
class="jetpack_remote_comment"
id="jetpack_remote_comment"
sandbox="allow-same-origin allow-top-navigation allow-scripts allow-forms allow-popups"
>
</iframe>
<!--[if !IE]><!-->
<script>
// After the DOM has been parsed, visit every element carrying the
// `jetpack_remote_comment` class and set its `allowTransparency` property
// to false and its `scrolling` property to 'no'.
document.addEventListener('DOMContentLoaded', function () {
  Array.prototype.forEach.call(
    document.getElementsByClassName('jetpack_remote_comment'),
    function (remoteFrame) {
      remoteFrame.allowTransparency = false;
      remoteFrame.scrolling = 'no';
    }
  );
});
</script>
<!--<![endif]-->
</form>
</div>
<input type="hidden" name="comment_parent" id="comment_parent" value="" />
<p class="akismet_comment_form_privacy_notice">This site uses Akismet to reduce spam. <a href="https://akismet.com/privacy/" target="_blank" rel="nofollow noopener">Learn how your comment data is processed.</a></p>
</div><!-- #comments -->
</main><!-- #main -->
</section><!-- #primary -->
<section id="secondary" class="sidebar widget-area clearfix" role="complementary">
<div class="widget-wrap"><aside id="search-3" class="widget widget_search clearfix">
<form class="search-form" action="https://circulatingnow.nlm.nih.gov/" method="get" role="search">
  <!-- Site search: sends the query as the "s" parameter via GET to the blog root. -->
  <label>
    <span class="screen-reader-text">Search for:</span>
    <input class="search-field" name="s" type="search" value="" placeholder="Search &hellip;" title="Search for:">
  </label>
  <button class="search-submit" type="submit">
    <!-- Icon is marked aria-hidden; the span after it supplies the button text. -->
    <svg class="icon icon-search" aria-hidden="true" role="img">
      <use xlink:href="https://circulatingnow.nlm.nih.gov/wp-content/themes/tortuga/assets/icons/genericons-neue.svg#search"></use>
    </svg>
    <span class="screen-reader-text">Search</span>
  </button>
</form>
</aside></div><div class="widget-wrap"><aside id="blog_subscription-4" class="widget widget_blog_subscription jetpack_subscription_widget clearfix"><div class="widget-header"><h3 class="widget-title">Follow Us via Email</h3></div>
<div class="wp-block-jetpack-subscriptions__container">
  <!-- Email subscription form: posts the address plus the hidden fields below back to the current page. -->
  <form id="subscribe-blog-blog_subscription-4" data-blog="52242398" data-post_access_level="everybody" action="#" method="post" accept-charset="utf-8">
    <div id="subscribe-text">
      <p>Enter your email address to follow this blog and receive notifications of new posts by email.</p>
    </div>

    <p id="subscribe-email">
      <label class="screen-reader-text" id="jetpack-subscribe-label" for="subscribe-field-blog_subscription-4">
        Email Address
      </label>
      <input id="subscribe-field-blog_subscription-4" name="email" type="email" value="" placeholder="Email Address" required="required">
    </p>

    <p id="subscribe-submit">
      <!-- Hidden fields submitted together with the email address. -->
      <input type="hidden" name="action" value="subscribe">
      <input type="hidden" name="source" value="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/">
      <input type="hidden" name="sub-type" value="widget">
      <input type="hidden" name="redirect_fragment" value="subscribe-blog-blog_subscription-4">
      <input type="hidden" id="_wpnonce" name="_wpnonce" value="d3fcec8ab9">
      <input type="hidden" name="_wp_http_referer" value="/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/">
      <button class="wp-block-button__link" name="jetpack_subscriptions_widget" type="submit">
        Follow
      </button>
    </p>
  </form>
</div>
</aside></div><div class="widget-wrap"><aside id="rss_links-4" class="widget widget_rss_links clearfix"><div class="widget-header"><h3 class="widget-title">Subscribe via RSS</h3></div><ul><li><a target="_self" href="https://circulatingnow.nlm.nih.gov/feed/" title="Subscribe to posts">RSS - Posts</a></li><li><a target="_self" href="https://circulatingnow.nlm.nih.gov/comments/feed/" title="Subscribe to comments">RSS - Comments</a></li></ul>
</aside></div><div class="widget-wrap"><aside id="categories-5" class="widget widget_categories clearfix"><div class="widget-header"><h3 class="widget-title">Topics</h3></div>
<ul>
<li class="cat-item cat-item-14520"><a href="https://circulatingnow.nlm.nih.gov/category/about-us/">About Us</a>
</li>
<li class="cat-item cat-item-12763"><a href="https://circulatingnow.nlm.nih.gov/category/collections/">Collections</a>
<ul class='children'>
<li class="cat-item cat-item-42333869"><a href="https://circulatingnow.nlm.nih.gov/category/collections/archives-manuscripts/">Archives &amp; Manuscripts</a>
</li>
<li class="cat-item cat-item-1359464"><a href="https://circulatingnow.nlm.nih.gov/category/collections/films-videos/">Films &amp; Videos</a>
</li>
<li class="cat-item cat-item-4940351"><a href="https://circulatingnow.nlm.nih.gov/category/collections/prints-photographs/">Prints &amp; Photographs</a>
</li>
<li class="cat-item cat-item-347145303"><a href="https://circulatingnow.nlm.nih.gov/category/collections/rare-books-journals/">Rare Books &amp; Journals</a>
</li>
</ul>
</li>
<li class="cat-item cat-item-2029"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/">Exhibitions</a>
<ul class='children'>
<li class="cat-item cat-item-51873791"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/confronting-violence/">Confronting Violence</a>
</li>
<li class="cat-item cat-item-51136828"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/for-all-the-people/">For All the People</a>
</li>
<li class="cat-item cat-item-207572835"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/from-dna-to-beer/">From DNA to Beer</a>
</li>
<li class="cat-item cat-item-43646346"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/graphic-medicine/">Graphic Medicine</a>
</li>
<li class="cat-item cat-item-39242778"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/harry-potters-world/">Harry Potter&#039;s World</a>
</li>
<li class="cat-item cat-item-678875970"><a href="https://circulatingnow.nlm.nih.gov/category/exhibitions/making-the-greatest-medical-library-in-america/">Making the Greatest Medical Library in America</a>
</li>
</ul>
</li>
<li class="cat-item cat-item-51014"><a href="https://circulatingnow.nlm.nih.gov/category/guests/">Guests</a>
</li>
<li class="cat-item cat-item-103"><a href="https://circulatingnow.nlm.nih.gov/category/news/">News</a>
</li>
<li class="cat-item cat-item-2347"><a href="https://circulatingnow.nlm.nih.gov/category/series/">Series</a>
<ul class='children'>
<li class="cat-item cat-item-608566155"><a href="https://circulatingnow.nlm.nih.gov/category/series/a-new-history-of-nlm/">A New History of NLM</a>
</li>
<li class="cat-item cat-item-204221395"><a href="https://circulatingnow.nlm.nih.gov/category/series/andreas-vesalius-at-500/">Andreas Vesalius at 500</a>
</li>
<li class="cat-item cat-item-354547839"><a href="https://circulatingnow.nlm.nih.gov/category/series/curious-herbals/">Curious Herbals</a>
</li>
<li class="cat-item cat-item-321229776"><a href="https://circulatingnow.nlm.nih.gov/category/series/deciphering-the-genetic-code/">Deciphering the Genetic Code</a>
</li>
<li class="cat-item cat-item-8370612"><a href="https://circulatingnow.nlm.nih.gov/category/series/garfield-assassination/">Garfield Assassination</a>
</li>
<li class="cat-item cat-item-610680187"><a href="https://circulatingnow.nlm.nih.gov/category/series/making-exhibition-connections/">Making Exhibition Connections</a>
</li>
<li class="cat-item cat-item-678875949"><a href="https://circulatingnow.nlm.nih.gov/category/series/nlm-collections-tour/">NLM Collections Tour</a>
</li>
<li class="cat-item cat-item-76943049"><a href="https://circulatingnow.nlm.nih.gov/category/series/revealing-data/">Revealing Data</a>
</li>
<li class="cat-item cat-item-1269102"><a href="https://circulatingnow.nlm.nih.gov/category/series/the-great-war/">The Great War</a>
</li>
</ul>
</li>
</ul>
</aside></div><div class="widget-wrap"><aside id="tag_cloud-3" class="widget widget_tag_cloud clearfix"><div class="widget-header"><h3 class="widget-title">Explore</h3></div><div class="tagcloud"><a href="https://circulatingnow.nlm.nih.gov/tag/1500s/" class="tag-cloud-link tag-link-903712 tag-link-position-1" style="font-size: 12.106666666667pt;" aria-label="1500s (35 items)">1500s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1600s/" class="tag-cloud-link tag-link-275516 tag-link-position-2" style="font-size: 12.666666666667pt;" aria-label="1600s (38 items)">1600s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1700s/" class="tag-cloud-link tag-link-411245 tag-link-position-3" style="font-size: 11.36pt;" aria-label="1700s (32 items)">1700s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1800s/" class="tag-cloud-link tag-link-273905 tag-link-position-4" style="font-size: 20.88pt;" aria-label="1800s (107 items)">1800s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1900s/" class="tag-cloud-link tag-link-273907 tag-link-position-5" style="font-size: 20.32pt;" aria-label="1900s (99 items)">1900s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1950s/" class="tag-cloud-link tag-link-24741 tag-link-position-6" style="font-size: 9.68pt;" aria-label="1950s (26 items)">1950s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/1960s/" class="tag-cloud-link tag-link-24742 tag-link-position-7" style="font-size: 12.106666666667pt;" aria-label="1960s (35 items)">1960s</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/african-american-history/" class="tag-cloud-link tag-link-168941 tag-link-position-8" style="font-size: 15.093333333333pt;" aria-label="African American History (52 items)">African American History</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/america/" class="tag-cloud-link tag-link-8055 tag-link-position-9" style="font-size: 9.12pt;" aria-label="America (24 items)">America</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/anatomy/" class="tag-cloud-link tag-link-26371 tag-link-position-10" style="font-size: 10.613333333333pt;" aria-label="anatomy (29 items)">anatomy</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/animals/" class="tag-cloud-link tag-link-490 tag-link-position-11" style="font-size: 10.613333333333pt;" aria-label="animals (29 items)">animals</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/anniversaries/" class="tag-cloud-link tag-link-678875953 tag-link-position-12" style="font-size: 11.173333333333pt;" aria-label="anniversaries (31 items)">anniversaries</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/archives/" class="tag-cloud-link tag-link-12080 tag-link-position-13" style="font-size: 14.533333333333pt;" aria-label="archives (48 items)">archives</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/art/" class="tag-cloud-link tag-link-177 tag-link-position-14" style="font-size: 18.64pt;" aria-label="art (80 items)">art</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/book-illustration/" class="tag-cloud-link tag-link-1480675 tag-link-position-15" style="font-size: 16.4pt;" aria-label="book illustration (61 items)">book illustration</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/children/" class="tag-cloud-link tag-link-1343 tag-link-position-16" style="font-size: 8pt;" aria-label="children (21 items)">children</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/covid-19/" class="tag-cloud-link tag-link-678875829 tag-link-position-17" style="font-size: 10.613333333333pt;" aria-label="COVID-19 (29 items)">COVID-19</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/data/" class="tag-cloud-link tag-link-22379 tag-link-position-18" style="font-size: 16.586666666667pt;" aria-label="data (62 items)">data</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/digital-humanities/" class="tag-cloud-link tag-link-541876 tag-link-position-19" style="font-size: 12.106666666667pt;" aria-label="digital humanities (35 items)">digital humanities</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/digitization/" class="tag-cloud-link tag-link-106484 tag-link-position-20" style="font-size: 13.04pt;" aria-label="digitization (40 items)">digitization</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/drugs/" class="tag-cloud-link tag-link-6200 tag-link-position-21" style="font-size: 9.12pt;" aria-label="drugs (24 items)">drugs</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/education/" class="tag-cloud-link tag-link-1342 tag-link-position-22" style="font-size: 13.04pt;" aria-label="education (40 items)">education</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/epidemic/" class="tag-cloud-link tag-link-136219 tag-link-position-23" style="font-size: 15.84pt;" aria-label="epidemic (56 items)">epidemic</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/film/" class="tag-cloud-link tag-link-524 tag-link-position-24" style="font-size: 17.52pt;" aria-label="film (70 items)">film</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/food/" class="tag-cloud-link tag-link-586 tag-link-position-25" style="font-size: 11.546666666667pt;" aria-label="food (33 items)">food</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/france/" class="tag-cloud-link tag-link-4704 tag-link-position-26" style="font-size: 10.613333333333pt;" aria-label="France (29 items)">France</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/germany/" class="tag-cloud-link tag-link-3550 tag-link-position-27" style="font-size: 8pt;" aria-label="Germany (21 items)">Germany</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/hidden-treasure/" class="tag-cloud-link tag-link-1487506 tag-link-position-28" style="font-size: 13.226666666667pt;" aria-label="Hidden Treasure (41 items)">Hidden Treasure</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/hospitals/" class="tag-cloud-link tag-link-38746 tag-link-position-29" style="font-size: 13.04pt;" aria-label="hospitals (40 items)">hospitals</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/interview/" class="tag-cloud-link tag-link-11788 tag-link-position-30" style="font-size: 22pt;" aria-label="interview (121 items)">interview</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/legislation/" class="tag-cloud-link tag-link-5563 tag-link-position-31" style="font-size: 12.853333333333pt;" aria-label="legislation (39 items)">legislation</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/letter/" class="tag-cloud-link tag-link-50991 tag-link-position-32" style="font-size: 9.68pt;" aria-label="letter (26 items)">letter</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/librarians/" class="tag-cloud-link tag-link-15380 tag-link-position-33" style="font-size: 9.68pt;" aria-label="librarians (26 items)">librarians</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/libraries/" class="tag-cloud-link tag-link-12499 tag-link-position-34" style="font-size: 10.613333333333pt;" aria-label="libraries (29 items)">libraries</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/manuscript/" class="tag-cloud-link tag-link-517998 tag-link-position-35" style="font-size: 16.4pt;" aria-label="manuscript (60 items)">manuscript</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/medicine-on-screen/" class="tag-cloud-link tag-link-671616459 tag-link-position-36" style="font-size: 12.106666666667pt;" aria-label="Medicine on Screen (35 items)">Medicine on Screen</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/mental-health/" class="tag-cloud-link tag-link-5004 tag-link-position-37" style="font-size: 10.8pt;" aria-label="mental health (30 items)">mental health</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/michael-e-debakey/" class="tag-cloud-link tag-link-1753209 tag-link-position-38" style="font-size: 8.7466666666667pt;" aria-label="Michael E. DeBakey (23 items)">Michael E. DeBakey</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/military/" class="tag-cloud-link tag-link-488 tag-link-position-39" style="font-size: 18.266666666667pt;" aria-label="military (76 items)">military</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/nih/" class="tag-cloud-link tag-link-631875 tag-link-position-40" style="font-size: 8.3733333333333pt;" aria-label="NIH (22 items)">NIH</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/fellowship/" class="tag-cloud-link tag-link-58980 tag-link-position-41" style="font-size: 12.853333333333pt;" aria-label="NLM DeBakey Fellowship (39 items)">NLM DeBakey Fellowship</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/nlmhisttalk/" class="tag-cloud-link tag-link-5711 tag-link-position-42" style="font-size: 19.013333333333pt;" aria-label="NLM History Talks (85 items)">NLM History Talks</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/nursing/" class="tag-cloud-link tag-link-7193 tag-link-position-43" style="font-size: 11.36pt;" aria-label="nursing (32 items)">nursing</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/photograph/" class="tag-cloud-link tag-link-12074 tag-link-position-44" style="font-size: 12.293333333333pt;" aria-label="photograph (36 items)">photograph</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/physician/" class="tag-cloud-link tag-link-541893 tag-link-position-45" style="font-size: 10.613333333333pt;" aria-label="physician (29 items)">physician</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/plants/" class="tag-cloud-link tag-link-15734 tag-link-position-46" style="font-size: 9.12pt;" aria-label="plants (24 items)">plants</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/posters/" class="tag-cloud-link tag-link-7195 tag-link-position-47" style="font-size: 12.106666666667pt;" aria-label="posters (35 items)">posters</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/profiles-in-science/" class="tag-cloud-link tag-link-5535849 tag-link-position-48" style="font-size: 9.68pt;" aria-label="Profiles in Science (26 items)">Profiles in Science</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/public-health/" class="tag-cloud-link tag-link-28006 tag-link-position-49" style="font-size: 19.946666666667pt;" aria-label="public health (95 items)">public health</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/race/" class="tag-cloud-link tag-link-678875950 tag-link-position-50" style="font-size: 11.733333333333pt;" aria-label="race (34 items)">race</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/rare-books/" class="tag-cloud-link tag-link-393736 tag-link-position-51" style="font-size: 9.68pt;" aria-label="Rare Books (26 items)">Rare Books</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/recent-acquisitions/" class="tag-cloud-link tag-link-2971278 tag-link-position-52" style="font-size: 15.093333333333pt;" aria-label="Recent Acquisitions (51 items)">Recent Acquisitions</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/research/" class="tag-cloud-link tag-link-668 tag-link-position-53" style="font-size: 20.693333333333pt;" aria-label="research (104 items)">research</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/surgeon-general/" class="tag-cloud-link tag-link-385674 tag-link-position-54" style="font-size: 9.12pt;" aria-label="Surgeon General (24 items)">Surgeon General</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/surgery/" class="tag-cloud-link tag-link-57544 tag-link-position-55" style="font-size: 8pt;" aria-label="surgery (21 items)">surgery</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/traveling-exhibitions/" class="tag-cloud-link tag-link-6044794 tag-link-position-56" style="font-size: 9.68pt;" aria-label="traveling exhibitions (26 items)">traveling exhibitions</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/web-collecting/" class="tag-cloud-link tag-link-238214791 tag-link-position-57" style="font-size: 8pt;" aria-label="web collecting (21 items)">web collecting</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/womens-history/" class="tag-cloud-link tag-link-97077 tag-link-position-58" style="font-size: 17.146666666667pt;" aria-label="Women&#039;s History (66 items)">Women&#039;s History</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/world-war-i/" class="tag-cloud-link tag-link-110820 tag-link-position-59" style="font-size: 14.906666666667pt;" aria-label="World War I (50 items)">World War I</a>
<a href="https://circulatingnow.nlm.nih.gov/tag/world-war-ii/" class="tag-cloud-link tag-link-62291 tag-link-position-60" style="font-size: 13.6pt;" aria-label="World War II (43 items)">World War II</a></div>
</aside></div><div class="widget-wrap"><aside id="archives-5" class="widget widget_archive clearfix"><div class="widget-header"><h3 class="widget-title">Archives</h3></div> <label class="screen-reader-text" for="archives-dropdown-5">Archives</label>
<select id="archives-dropdown-5" name="archive-dropdown">
<option value="">Select Month</option>
<option value='https://circulatingnow.nlm.nih.gov/2025/01/'> January 2025 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/12/'> December 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/11/'> November 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/10/'> October 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/09/'> September 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/08/'> August 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/07/'> July 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/06/'> June 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/05/'> May 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/04/'> April 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/03/'> March 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/02/'> February 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2024/01/'> January 2024 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/12/'> December 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/11/'> November 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/10/'> October 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/09/'> September 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/08/'> August 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/07/'> July 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/06/'> June 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/05/'> May 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/04/'> April 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/03/'> March 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/02/'> February 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2023/01/'> January 2023 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/12/'> December 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/11/'> November 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/10/'> October 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/09/'> September 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/08/'> August 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/07/'> July 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/06/'> June 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/05/'> May 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/04/'> April 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/03/'> March 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/02/'> February 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2022/01/'> January 2022 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/12/'> December 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/11/'> November 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/10/'> October 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/09/'> September 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/08/'> August 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/07/'> July 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/06/'> June 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/05/'> May 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/04/'> April 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/03/'> March 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/02/'> February 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2021/01/'> January 2021 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/12/'> December 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/11/'> November 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/10/'> October 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/09/'> September 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/08/'> August 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/07/'> July 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/06/'> June 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/05/'> May 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/04/'> April 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/03/'> March 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/02/'> February 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2020/01/'> January 2020 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/12/'> December 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/11/'> November 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/10/'> October 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/09/'> September 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/08/'> August 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/07/'> July 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/06/'> June 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/05/'> May 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/04/'> April 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/03/'> March 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/02/'> February 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2019/01/'> January 2019 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/12/'> December 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/11/'> November 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/10/'> October 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/09/'> September 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/08/'> August 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/07/'> July 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/06/'> June 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/05/'> May 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/04/'> April 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/03/'> March 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/02/'> February 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2018/01/'> January 2018 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/12/'> December 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/11/'> November 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/10/'> October 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/09/'> September 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/08/'> August 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/07/'> July 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/06/'> June 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/05/'> May 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/04/'> April 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/03/'> March 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/02/'> February 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2017/01/'> January 2017 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/12/'> December 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/11/'> November 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/10/'> October 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/09/'> September 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/08/'> August 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/07/'> July 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/06/'> June 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/05/'> May 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/04/'> April 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/03/'> March 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/02/'> February 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2016/01/'> January 2016 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/12/'> December 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/11/'> November 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/10/'> October 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/09/'> September 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/08/'> August 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/07/'> July 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/06/'> June 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/05/'> May 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/04/'> April 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/03/'> March 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/02/'> February 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2015/01/'> January 2015 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/12/'> December 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/11/'> November 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/10/'> October 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/09/'> September 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/08/'> August 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/07/'> July 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/06/'> June 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/05/'> May 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/04/'> April 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/03/'> March 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/02/'> February 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2014/01/'> January 2014 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/12/'> December 2013 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/11/'> November 2013 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/10/'> October 2013 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/09/'> September 2013 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/08/'> August 2013 </option>
<option value='https://circulatingnow.nlm.nih.gov/2013/07/'> July 2013 </option>
</select>
<script type="text/javascript">
/* <![CDATA[ */
// Archives month picker: when an option with a non-empty value is chosen,
// navigate the document to that option's value (a monthly archive URL).
(function() {
	var archiveSelect = document.getElementById( "archives-dropdown-5" );

	archiveSelect.onchange = function onSelectChange() {
		// The "Select Month" placeholder has an empty value; ignore it.
		if ( archiveSelect.options[ archiveSelect.selectedIndex ].value === '' ) {
			return;
		}
		document.location.href = this.options[ this.selectedIndex ].value;
	};
})();
/* ]]> */
</script>
</aside></div><div class="widget-wrap"><aside id="text-4" class="widget widget_text clearfix"><div class="widget-header"><h3 class="widget-title">VISIT US</h3></div> <div class="textwidget"><a href="https://www.nlm.nih.gov/hmd/index.html">History of Medicine Division</a> at the <a href="https://www.nlm.nih.gov/">National Library of Medicine</a></div>
</aside></div><div class="widget-wrap"><aside id="google_translate_widget-5" class="widget widget_google_translate_widget clearfix"><div class="widget-header"><h3 class="widget-title">Translate This Blog</h3></div><div id="google_translate_element"></div></aside></div><div class="widget-wrap"><aside id="block-2" class="widget widget_block widget_text clearfix">
<p>National Library of Medicine<br><a href="https://www.google.com/maps/place/8600+Rockville+Pike,+Bethesda,+MD+20894/@38.9959508,-77.101021,17z/data=!3m1!4b1!4m5!3m4!1s0x89b7c95e25765ddb:0x19156f88b27635b8!8m2!3d38.9959508!4d-77.0988323">8600 Rockville Pike<br>Bethesda, MD 20894</a></p>
</aside></div><div class="widget-wrap"><aside id="block-3" class="widget widget_block widget_text clearfix">
<p><a href="https://www.nlm.nih.gov/web_policies.html">Web Policies</a><br><a href="https://www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office">FOIA</a><br><a href="https://www.hhs.gov/vulnerability-disclosure-policy/index.html">HHS Vulnerability Disclosure</a></p>
</aside></div><div class="widget-wrap"><aside id="block-4" class="widget widget_block widget_text clearfix">
<p><a href="https://support.nlm.nih.gov/?from=https://circulatingnow.nlm.nih.gov/">NLM Support Center</a><br><a href="https://www.nlm.nih.gov/accessibility.html">Accessibility</a><br><a href="https://www.nlm.nih.gov/careers/careers.html">Careers</a></p>
</aside></div><div class="widget-wrap"><aside id="block-5" class="widget widget_block widget_text clearfix">
<p><a href="https://www.nlm.nih.gov/">NLM</a>&nbsp;|&nbsp;<a href="https://www.nih.gov/">NIH</a>&nbsp;|&nbsp;<a href="https://www.hhs.gov/">HHS</a>&nbsp;|&nbsp;<a href="https://www.usa.gov/">USA.gov</a></p>
</aside></div><div class="widget-wrap"><aside id="block-16" class="widget widget_block clearfix"><h3 class="widget-title">Connect with NLM</h3>
<!-- Icon-only links: the image alt text is the link's accessible name, so it must not be empty. -->
<figure class="wp-block-image size-large nlmicon"><a href="https://www.facebook.com/nationallibraryofmedicine"><img decoding="async" src="https://www.nlm.nih.gov/images/facebook_white.svg" alt="NLM on Facebook"/></a></figure>
<figure class="wp-block-image size-large nlmicon"><a href="https://twitter.com/nlm_nih"><img decoding="async" src="https://www.nlm.nih.gov/images/twitter_white.svg" style="padding:10px" alt="NLM on Twitter"/></a></figure>
<figure class="wp-block-image size-large nlmicon"><a href="https://www.linkedin.com/company/national-library-of-medicine-nlm"><img decoding="async" src="https://www.nlm.nih.gov/images/linkedin_white.svg" alt="NLM on LinkedIn"/></a></figure></aside></div><div class="widget-wrap"><aside id="jetpack_display_posts_widget-4" class="widget widget_jetpack_display_posts_widget clearfix"><div class="widget-header"><h3 class="widget-title">Films and Essays from NLM: Medicine on Screen</h3></div><div class="jetpack-display-remote-posts"><h4><a href="https://medicineonscreen.nlm.nih.gov/2024/07/09/promoting-birth-control-in-1970s-colombia-unlikely-alliances-on-and-off-the-screen/">Promoting Birth Control in 1970s Colombia: Unlikely Alliances On and Off the Screen</a></h4>
<a title="Promoting Birth Control in 1970s Colombia: Unlikely Alliances On and Off the Screen" href="https://medicineonscreen.nlm.nih.gov/2024/07/09/promoting-birth-control-in-1970s-colombia-unlikely-alliances-on-and-off-the-screen/"><img src="https://i0.wp.com/medicineonscreen.nlm.nih.gov/wp-content/uploads/2024/06/the-city_101194160.jpg?fit=625%2C480&amp;ssl=1" alt="Promoting Birth Control in 1970s Colombia: Unlikely Alliances On and Off the Screen"/></a></div><!-- .jetpack-display-remote-posts --></aside></div><div class="widget-wrap"><aside id="wpcom_social_media_icons_widget-4" class="widget widget_wpcom_social_media_icons_widget clearfix"><div class="widget-header"><h3 class="widget-title">Explore History at NLM</h3></div><ul><li><a href="https://www.instagram.com/nlm_collections/" class="genericon genericon-instagram" target="_blank" rel="noopener noreferrer"><span class="screen-reader-text">View nlm_collections&#8217;s profile on Instagram</span></a></li><li><a href="https://www.pinterest.com/NLMHistory/" class="genericon genericon-pinterest" target="_blank" rel="noopener noreferrer"><span class="screen-reader-text">View NLMHistory&#8217;s profile on Pinterest</span></a></li><li><a href="https://www.youtube.com/user/NLMNIH/" class="genericon genericon-youtube" target="_blank" rel="noopener noreferrer"><span class="screen-reader-text">View NLMNIH&#8217;s profile on YouTube</span></a></li><li><a href="https://www.flickr.com/photos/nlmhmd/" class="genericon genericon-flickr" target="_blank" rel="noopener noreferrer"><span class="screen-reader-text">View nlmhmd&#8217;s profile on Flickr</span></a></li></ul></aside></div>
</section><!-- #secondary -->
</div><!-- #content -->
<!-- Site footer: wrapper, contentinfo landmark, and the theme credit line. -->
<div id="footer" class="footer-wrap">
  <footer id="colophon" class="site-footer container clearfix" role="contentinfo">
    <div id="footer-text" class="site-info">
      <span class="credit-link">
        WordPress ThemeZee. </span>
    </div><!-- .site-info -->
  </footer><!-- #colophon -->
</div><!-- #footer -->
</div><!-- #page -->
<!-- -->
<script defer id="bilmur" data-customproperties="{&quot;woo_active&quot;:&quot;0&quot;}" data-provider="wordpress.com" data-service="atomic" src="https://s0.wp.com/wp-content/js/bilmur.min.js?m=202510" data-site-tz="America/New_York"></script>
<!-- Jetpack subscription modal: email sign-up form that POSTs to wordpress.com/email-subscriptions. -->
<div class="jetpack-subscription-modal">
<div class="jetpack-subscription-modal__modal-content">
<div class="wp-block-group has-border-color jetpack-subscription-modal__modal-content-form" style="border-color:#dddddd;border-width:1px;margin-top:0;margin-bottom:0;padding:32px"><div class="wp-block-group__inner-container is-layout-flow wp-block-group-is-layout-flow">
<h2 class="wp-block-heading has-text-align-center" style="margin-top:4px;margin-bottom:10px;font-size:26px;font-style:normal;font-weight:600">Discover more from Circulating Now from the NLM Historical Collections</h2>
<p class='has-text-align-center' style='margin-top:4px;margin-bottom:0px;font-size:15px'>Subscribe now to keep reading and get access to the full archive.</p>
<div class="wp-block-jetpack-subscriptions__supports-newline is-style-compact wp-block-jetpack-subscriptions">
<div class="wp-block-jetpack-subscriptions__container is-not-subscriber">
<form
action="https://wordpress.com/email-subscriptions"
method="post"
accept-charset="utf-8"
data-blog="52242398"
data-post_access_level="everybody"
data-subscriber_email=""
id="subscribe-blog-3"
>
<div class="wp-block-jetpack-subscriptions__form-elements">
<p id="subscribe-email">
<label
id="subscribe-field-3-label"
for="subscribe-field-3"
class="screen-reader-text"
>
Type your email… </label>
<!-- autocomplete="email" lets browsers and password managers autofill the address. -->
<input
required
type="email"
name="email"
autocomplete="email"
style="font-size: 16px;padding: 15px 23px 15px 23px;border-radius: 50px;border-width: 1px;"
placeholder="Type your email…"
value=""
id="subscribe-field-3"
title="Please fill in this field."
/> </p>
<p id="subscribe-submit"
>
<input type="hidden" name="action" value="subscribe"/>
<input type="hidden" name="blog_id" value="52242398"/>
<input type="hidden" name="source" value="https://circulatingnow.nlm.nih.gov/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/"/>
<input type="hidden" name="sub-type" value="subscribe-block"/>
<input type="hidden" name="app_source" value="atomic-subscription-modal-lo"/>
<input type="hidden" name="redirect_fragment" value="subscribe-blog-3"/>
<input type="hidden" name="lang" value="en_US"/>
<input type="hidden" id="_wpnonce" name="_wpnonce" value="d3fcec8ab9" /><input type="hidden" name="_wp_http_referer" value="/2021/05/13/exploring-the-data-of-web-archives-as-part-of-data-science-nlm/" /><input type="hidden" name="post_id" value="21153"/> <button type="submit"
class="wp-block-button__link"
style="font-size: 16px;padding: 15px 23px 15px 23px;margin: 0; margin-left: 10px;border-radius: 50px;border-width: 1px;"
name="jetpack_subscriptions_widget"
>
Subscribe </button>
</p>
</div>
</form>
</div>
</div>
<!-- NOTE(review): this link has no destination (href="#"); presumably a script closes the modal on click — confirm before changing the element. -->
<p class="has-text-align-center jetpack-subscription-modal__close" style="margin-top:20px;font-size:14px"><a href="#">Continue reading</a></p>
</div></div>
</div>
</div>
<div style="display:none">
<div class="grofile-hash-map-c19b566d0dc4245aba204c976266d3db">
</div>
</div>
<!-- Carousel loading overlay: wrapper plus a placeholder span containing only a non-breaking space. -->
<div id="jp-carousel-loading-overlay">
  <div id="jp-carousel-loading-wrapper">
    <span id="jp-carousel-library-loading">&nbsp;</span>
  </div>
</div>
<div class="jp-carousel-overlay" style="display: none;">
<div class="jp-carousel-container">
<!-- The Carousel Swiper -->
<div
class="jp-carousel-wrap swiper-container jp-carousel-swiper-container jp-carousel-transitions"
itemscope
itemtype="https://schema.org/ImageGallery">
<div class="jp-carousel swiper-wrapper"></div>
<!-- Previous-slide control. The chevron is purely decorative, so it is hidden from assistive technology. -->
<div class="jp-swiper-button-prev swiper-button-prev">
  <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
    <mask id="maskPrev" mask-type="alpha" maskUnits="userSpaceOnUse" x="8" y="6" width="9" height="12">
      <path d="M16.2072 16.59L11.6496 12L16.2072 7.41L14.8041 6L8.8335 12L14.8041 18L16.2072 16.59Z" fill="white"/>
    </mask>
    <g mask="url(#maskPrev)">
      <rect x="0.579102" width="23.8823" height="24" fill="#FFFFFF"/>
    </g>
  </svg>
</div>
<!-- Next-slide control. The chevron is purely decorative, so it is hidden from assistive technology. -->
<div class="jp-swiper-button-next swiper-button-next">
  <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
    <mask id="maskNext" mask-type="alpha" maskUnits="userSpaceOnUse" x="8" y="6" width="8" height="12">
      <path d="M8.59814 16.59L13.1557 12L8.59814 7.41L10.0012 6L15.9718 12L10.0012 18L8.59814 16.59Z" fill="white"/>
    </mask>
    <g mask="url(#maskNext)">
      <rect x="0.34375" width="23.8822" height="24" fill="#FFFFFF"/>
    </g>
  </svg>
</div>
</div>
<!-- The main close buton -->
<!-- Close control. The "X" glyph is decorative, so it is hidden from assistive technology. -->
<div class="jp-carousel-close-hint">
  <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
    <mask id="maskClose" mask-type="alpha" maskUnits="userSpaceOnUse" x="5" y="5" width="15" height="14">
      <path d="M19.3166 6.41L17.9135 5L12.3509 10.59L6.78834 5L5.38525 6.41L10.9478 12L5.38525 17.59L6.78834 19L12.3509 13.41L17.9135 19L19.3166 17.59L13.754 12L19.3166 6.41Z" fill="white"/>
    </mask>
    <g mask="url(#maskClose)">
      <rect x="0.409668" width="23.8823" height="24" fill="#FFFFFF"/>
    </g>
  </svg>
</div>
<!-- Image info, comments and meta -->
<div class="jp-carousel-info">
<div class="jp-carousel-info-footer">
<div class="jp-carousel-pagination-container">
<div class="jp-swiper-pagination swiper-pagination"></div>
<div class="jp-carousel-pagination"></div>
</div>
<div class="jp-carousel-photo-title-container">
<h2 class="jp-carousel-photo-caption"></h2>
</div>
<div class="jp-carousel-photo-icons-container">
<!-- Metadata toggle. The accessible name comes from aria-label, so the icon itself is hidden from assistive technology. -->
<a href="#" class="jp-carousel-icon-btn jp-carousel-icon-info" aria-label="Toggle photo metadata visibility">
  <span class="jp-carousel-icon">
    <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
      <mask id="maskInfo" mask-type="alpha" maskUnits="userSpaceOnUse" x="2" y="2" width="21" height="20">
        <path fill-rule="evenodd" clip-rule="evenodd" d="M12.7537 2C7.26076 2 2.80273 6.48 2.80273 12C2.80273 17.52 7.26076 22 12.7537 22C18.2466 22 22.7046 17.52 22.7046 12C22.7046 6.48 18.2466 2 12.7537 2ZM11.7586 7V9H13.7488V7H11.7586ZM11.7586 11V17H13.7488V11H11.7586ZM4.79292 12C4.79292 16.41 8.36531 20 12.7537 20C17.142 20 20.7144 16.41 20.7144 12C20.7144 7.59 17.142 4 12.7537 4C8.36531 4 4.79292 7.59 4.79292 12Z" fill="white"/>
      </mask>
      <g mask="url(#maskInfo)">
        <rect x="0.8125" width="23.8823" height="24" fill="#FFFFFF"/>
      </g>
    </svg>
  </span>
</a>
<!-- Comments toggle. The accessible name comes from aria-label, so the icon itself is hidden from assistive technology. -->
<a href="#" class="jp-carousel-icon-btn jp-carousel-icon-comments" aria-label="Toggle photo comments visibility">
  <span class="jp-carousel-icon">
    <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
      <mask id="maskComments" mask-type="alpha" maskUnits="userSpaceOnUse" x="2" y="2" width="21" height="20">
        <path fill-rule="evenodd" clip-rule="evenodd" d="M4.3271 2H20.2486C21.3432 2 22.2388 2.9 22.2388 4V16C22.2388 17.1 21.3432 18 20.2486 18H6.31729L2.33691 22V4C2.33691 2.9 3.2325 2 4.3271 2ZM6.31729 16H20.2486V4H4.3271V18L6.31729 16Z" fill="white"/>
      </mask>
      <g mask="url(#maskComments)">
        <rect x="0.34668" width="23.8823" height="24" fill="#FFFFFF"/>
      </g>
    </svg>
    <span class="jp-carousel-has-comments-indicator" aria-label="This image has comments."></span>
  </span>
</a>
</div>
</div>
<div class="jp-carousel-info-extra">
<div class="jp-carousel-info-content-wrapper">
<div class="jp-carousel-photo-title-container">
<h2 class="jp-carousel-photo-title"></h2>
</div>
<div class="jp-carousel-comments-wrapper">
<div id="jp-carousel-comments-loading">
<span>Loading Comments...</span>
</div>
<div class="jp-carousel-comments"></div>
<div id="jp-carousel-comment-form-container">
<span id="jp-carousel-comment-form-spinner">&nbsp;</span>
<div id="jp-carousel-comment-post-results"></div>
<!--
  Carousel comment form: comment text plus commenter email, name and website.
  autocomplete tokens are added so browsers can autofill the identity fields.
  NOTE(review): the fields stay type="text" so native validation does not
  intercept submission; presumably a script validates them — confirm.
-->
<form id="jp-carousel-comment-form">
  <label for="jp-carousel-comment-form-comment-field" class="screen-reader-text">Write a Comment...</label>
  <textarea
    name="comment"
    class="jp-carousel-comment-form-field jp-carousel-comment-form-textarea"
    id="jp-carousel-comment-form-comment-field"
    placeholder="Write a Comment..."
  ></textarea>
  <div id="jp-carousel-comment-form-submit-and-info-wrapper">
    <div id="jp-carousel-comment-form-commenting-as">
      <fieldset>
        <label for="jp-carousel-comment-form-email-field">Email (Required)</label>
        <input type="text" name="email" autocomplete="email" class="jp-carousel-comment-form-field jp-carousel-comment-form-text-field" id="jp-carousel-comment-form-email-field" />
      </fieldset>
      <fieldset>
        <label for="jp-carousel-comment-form-author-field">Name (Required)</label>
        <input type="text" name="author" autocomplete="name" class="jp-carousel-comment-form-field jp-carousel-comment-form-text-field" id="jp-carousel-comment-form-author-field" />
      </fieldset>
      <fieldset>
        <label for="jp-carousel-comment-form-url-field">Website</label>
        <input type="text" name="url" autocomplete="url" class="jp-carousel-comment-form-field jp-carousel-comment-form-text-field" id="jp-carousel-comment-form-url-field" />
      </fieldset>
    </div>
    <input
      type="submit"
      name="submit"
      class="jp-carousel-comment-form-button"
      id="jp-carousel-comment-form-button-submit"
      value="Post Comment" />
  </div>
</form>
</div>
</div>
<div class="jp-carousel-image-meta">
<div class="jp-carousel-title-and-caption">
<div class="jp-carousel-photo-info">
<h3 class="jp-carousel-caption" itemprop="caption description"></h3>
</div>
<div class="jp-carousel-photo-description"></div>
</div>
<ul class="jp-carousel-image-exif" style="display: none;"></ul>
<!--
  Download link, hidden by default and opened in a new tab.
  rel="noopener noreferrer" stops the opened page from reaching window.opener.
  The icon is decorative; the visible label lives in .jp-carousel-download-text.
-->
<a class="jp-carousel-image-download" href="#" target="_blank" rel="noopener noreferrer" style="display: none;">
  <svg width="25" height="24" viewBox="0 0 25 24" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false">
    <mask id="mask0" mask-type="alpha" maskUnits="userSpaceOnUse" x="3" y="3" width="19" height="18">
      <path fill-rule="evenodd" clip-rule="evenodd" d="M5.84615 5V19H19.7775V12H21.7677V19C21.7677 20.1 20.8721 21 19.7775 21H5.84615C4.74159 21 3.85596 20.1 3.85596 19V5C3.85596 3.9 4.74159 3 5.84615 3H12.8118V5H5.84615ZM14.802 5V3H21.7677V10H19.7775V6.41L9.99569 16.24L8.59261 14.83L18.3744 5H14.802Z" fill="white"/>
    </mask>
    <g mask="url(#mask0)">
      <rect x="0.870605" width="23.8823" height="24" fill="#FFFFFF"/>
    </g>
  </svg>
  <span class="jp-carousel-download-text"></span>
</a>
<div class="jp-carousel-image-map" style="display: none;"></div>
</div>
</div>
</div>
</div>
</div>
</div>
<script type="text/javascript">
window.WPCOM_sharing_counts = {"https:\/\/circulatingnow.nlm.nih.gov\/2021\/05\/13\/exploring-the-data-of-web-archives-as-part-of-data-science-nlm\/":21153};
</script>
<link rel='stylesheet' id='all-css-d3eed8408a4b1b24afe0fda9758945f1' href='https://circulatingnow.nlm.nih.gov/_static/??-eJyVj9EKwjAMRX/IGHUo+iB+itQ2lGjWlqal7O8dTH0S3Z6S3JscbloCG0OhUDBJ9RwU71SSsQ/so6tCitbkWJUEtXGiDLcanNDaqq7aguuXAW9hLqCwkANvRCgPv6a5wMbOUxlrzC5lUoUUtcAko5bh/3NXDhY9Bco8ruj3dmkejZaNQE+ODUywT5hLf94eTt2u2+y74xOzmadK' type='text/css' media='all' />
<style id='jetpack-block-subscriptions-inline-css'>
.is-style-compact .is-not-subscriber .wp-block-button__link,.is-style-compact .is-not-subscriber .wp-block-jetpack-subscriptions__button{border-end-start-radius:0!important;border-start-start-radius:0!important;margin-inline-start:0!important}.is-style-compact .is-not-subscriber .components-text-control__input,.is-style-compact .is-not-subscriber p#subscribe-email input[type=email]{border-end-end-radius:0!important;border-start-end-radius:0!important}.is-style-compact:not(.wp-block-jetpack-subscriptions__use-newline) .components-text-control__input{border-inline-end-width:0!important}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form-container{display:flex;flex-direction:column}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline:not(.wp-block-jetpack-subscriptions__use-newline) .is-not-subscriber .wp-block-jetpack-subscriptions__form-elements{align-items:flex-start;display:flex}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline:not(.wp-block-jetpack-subscriptions__use-newline) p#subscribe-submit{display:flex;justify-content:center}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__textfield .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form input[type=email],.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline 
form .wp-block-jetpack-subscriptions__textfield .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form input[type=email]{box-sizing:border-box;cursor:pointer;line-height:1.3;min-width:auto!important;white-space:nowrap!important}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__button[contenteditable=true],.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__button[contenteditable=true]{white-space:pre-wrap!important}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form input[type=email]::placeholder,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form input[type=email]:disabled,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form input[type=email]::placeholder,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form input[type=email]:disabled{color:currentColor;opacity:.5}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form button{border-color:#0000;border-style:solid}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form 
.wp-block-jetpack-subscriptions__textfield,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-email,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__textfield,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-email{background:#0000;flex-grow:1}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__textfield .components-base-control__field,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__textfield .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form .wp-block-jetpack-subscriptions__textfield input[type=email],.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-email .components-base-control__field,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-email .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-email input[type=email],.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__textfield .components-base-control__field,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__textfield .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form .wp-block-jetpack-subscriptions__textfield 
input[type=email],.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-email .components-base-control__field,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-email .components-text-control__input,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-email input[type=email]{height:auto;margin:0;width:100%}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-email,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline .wp-block-jetpack-subscriptions__form p#subscribe-submit,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-email,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline form p#subscribe-submit{line-height:0;margin:0;padding:0}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline.wp-block-jetpack-subscriptions__show-subs .wp-block-jetpack-subscriptions__subscount{font-size:16px;margin:8px 0;text-align:end}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline.wp-block-jetpack-subscriptions__use-newline .wp-block-jetpack-subscriptions__form-elements{display:block}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline.wp-block-jetpack-subscriptions__use-newline .wp-block-jetpack-subscriptions__button,.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline.wp-block-jetpack-subscriptions__use-newline button{display:inline-block;max-width:100%}.wp-block-jetpack-subscriptions.wp-block-jetpack-subscriptions__supports-newline.wp-block-jetpack-subscriptions__use-newline .wp-block-jetpack-subscriptions__subscount{text-align:start}#subscribe-submit.is-link{text-align:center;width:auto!important}#subscribe-submit.is-link 
a{margin-left:0!important;margin-top:0!important;width:auto!important}@keyframes jetpack-memberships_button__spinner-animation{to{transform:rotate(1turn)}}.jetpack-memberships-spinner{display:none;height:1em;margin:0 0 0 5px;width:1em}.jetpack-memberships-spinner svg{height:100%;margin-bottom:-2px;width:100%}.jetpack-memberships-spinner-rotating{animation:jetpack-memberships_button__spinner-animation .75s linear infinite;transform-origin:center}.is-loading .jetpack-memberships-spinner{display:inline-block}body.jetpack-memberships-modal-open{overflow:hidden}dialog.jetpack-memberships-modal{opacity:1}dialog.jetpack-memberships-modal,dialog.jetpack-memberships-modal iframe{background:#0000;border:0;bottom:0;box-shadow:none;height:100%;left:0;margin:0;padding:0;position:fixed;right:0;top:0;width:100%}dialog.jetpack-memberships-modal::backdrop{background-color:#000;opacity:.7;transition:opacity .2s ease-out}dialog.jetpack-memberships-modal.is-loading,dialog.jetpack-memberships-modal.is-loading::backdrop{opacity:0}
</style>
<style id='core-block-supports-inline-css'>
/* Direct children that are not left-, right- or full-aligned: cap at 480px and centre. */
.wp-container-core-group-is-layout-1 > :where(:not(.alignleft):not(.alignright):not(.alignfull)) {
	max-width: 480px;
	margin-left: auto !important;
	margin-right: auto !important;
}

/* Wide-aligned direct children get the same 480px cap. */
.wp-container-core-group-is-layout-1 > .alignwide {
	max-width: 480px;
}

/* Full-aligned descendants are not width-limited. */
.wp-container-core-group-is-layout-1 .alignfull {
	max-width: none;
}
</style>
<script type="text/javascript" id="coblocks-tinyswiper-initializer-js-extra">
/* <![CDATA[ */
var coblocksTinyswiper = {"carouselPrevButtonAriaLabel":"Previous","carouselNextButtonAriaLabel":"Next","sliderImageAriaLabel":"Image"};
/* ]]> */
</script>
<script type="text/javascript" id="tortuga-navigation-js-extra">
/* <![CDATA[ */
var tortugaScreenReaderText = {"expand":"Expand child menu","collapse":"Collapse child menu","icon":"<svg class=\"icon icon-expand\" aria-hidden=\"true\" role=\"img\"> <use xlink:href=\"https:\/\/circulatingnow.nlm.nih.gov\/wp-content\/themes\/tortuga\/assets\/icons\/genericons-neue.svg#expand\"><\/use> <\/svg>"};
/* ]]> */
</script>
<script type="text/javascript" id="subscription-modal-js-js-extra">
/* <![CDATA[ */
var subscriptionData = {"homeUrl":"circulatingnow.nlm.nih.gov"};
/* ]]> */
</script>
<script type='text/javascript' src='https://circulatingnow.nlm.nih.gov/_static/??-eJyNjlFuAjEMRC/U1CAVwU/Vs2QTK3hJnCh22G5PT1ZLadUixJ/t8ZuZqRiXWZEVSmyBWMDlIWZ3EvAkCuPPwVimZJUyv47yMj1BnpF9rgJKPBuZqGB9Fr2FLuyKGmJSspG+/tnoERP2nFy1BQtWBFUWG7ZnCmvnRN+9iV1sHmXNSak7mIolzr9+/hYMra8D1gBDo+jB59QZ62cg9vj5gBxRi3UnSNm3iLdEAWmDuEplaWe6aqPpw1W+o3b/j/S+3b9tdtvd4bC5ADw6qaw='></script>
<script type="text/javascript" src="https://secure.gravatar.com/js/gprofiles.js?ver=202510" id="grofiles-cards-js"></script>
<script type="text/javascript" id="wpgroho-js-extra">
/* <![CDATA[ */
var WPGroHo = {"my_hash":""};
/* ]]> */
</script>
<script type='text/javascript' src='https://circulatingnow.nlm.nih.gov/wp-content/plugins/jetpack/modules/wpgroho.js?m=1730206540'></script>
<script type="text/javascript" id="front_end_js-js-extra">
/* <![CDATA[ */
var blnotifier_front_end = {"show_in_console":"","admin_dir":"wp-admin","scan_header":"","scan_footer":"","elements":{"a":"href","iframe":"src","video":"src","img":"src"},"nonce":"fcca7daeae","ajaxurl":"https:\/\/circulatingnow.nlm.nih.gov\/wp-admin\/admin-ajax.php"};
/* ]]> */
</script>
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/wp-content/plugins/broken-link-notifier/includes/js/results-front.js?ver=1.2.0" id="front_end_js-js"></script>
<script type='text/javascript' src='https://circulatingnow.nlm.nih.gov/wp-content/plugins/jetpack/_inc/build/likes/queuehandler.min.js?m=1740419734'></script>
<script type="text/javascript" id="jetpack-stats-js-before">
/* <![CDATA[ */
// Reuse an existing window._stq queue if one is already defined; otherwise start with an empty array.
_stq = window._stq || [];
// Queue a "view" entry whose payload is the object parsed from the embedded JSON string.
_stq.push([ "view", JSON.parse("{\"v\":\"ext\",\"blog\":\"52242398\",\"post\":\"21153\",\"tz\":\"-5\",\"srv\":\"circulatingnow.nlm.nih.gov\",\"hp\":\"atomic\",\"ac\":\"2\",\"amp\":\"0\",\"j\":\"1:14.4\"}") ]);
// Queue a "clickTrackerInit" entry carrying the same blog and post ids as the view payload.
_stq.push([ "clickTrackerInit", "52242398", "21153" ]);
/* ]]> */
</script>
<script type="text/javascript" src="https://stats.wp.com/e-202510.js" id="jetpack-stats-js" defer="defer" data-wp-strategy="defer"></script>
<script type="text/javascript" id="jetpack-carousel-js-extra">
/* <![CDATA[ */
var jetpackSwiperLibraryPath = {"url":"https:\/\/circulatingnow.nlm.nih.gov\/wp-content\/plugins\/jetpack\/_inc\/build\/carousel\/swiper-bundle.min.js"};
var jetpackCarouselStrings = {"widths":[370,700,1000,1200,1400,2000],"is_logged_in":"","lang":"en","ajaxurl":"https:\/\/circulatingnow.nlm.nih.gov\/wp-admin\/admin-ajax.php","nonce":"171eaffc49","display_exif":"1","display_comments":"1","single_image_gallery":"1","single_image_gallery_media_file":"","background_color":"black","comment":"Comment","post_comment":"Post Comment","write_comment":"Write a Comment...","loading_comments":"Loading Comments...","image_label":"Open image in full-screen.","download_original":"View full size <span class=\"photo-size\">{0}<span class=\"photo-size-times\">\u00d7<\/span>{1}<\/span>","no_comment_text":"Please be sure to submit some text with your comment.","no_comment_email":"Please provide an email address to comment.","no_comment_author":"Please provide your name to comment.","comment_post_error":"Sorry, but there was an error posting your comment. Please try again later.","comment_approved":"Your comment was approved.","comment_unapproved":"Your comment is in moderation.","camera":"Camera","aperture":"Aperture","shutter_speed":"Shutter Speed","focal_length":"Focal Length","copyright":"Copyright","comment_registration":"0","require_name_email":"1","login_url":"https:\/\/circulatingnow.nlm.nih.gov\/wp-login.php?redirect_to=https%3A%2F%2Fcirculatingnow.nlm.nih.gov%2F2021%2F05%2F13%2Fexploring-the-data-of-web-archives-as-part-of-data-science-nlm%2F","blog_id":"1","meta_data":["camera","aperture","shutter_speed","focal_length","copyright"]};
/* ]]> */
</script>
<script type='text/javascript' src='https://circulatingnow.nlm.nih.gov/_static/??-eJyNjEkKgDAMAD9kDeJ+EJ8itYaSGmOxLeLvvehVPM4MzOmV2SWiRPCcLEkAh9Frs8JEYmBOxAsYfewpIL9NvSLfSHIXsvPXJhLjoqxmxuP6omc7bkPRllVZd33R3MRXPxI='></script>
<script type="text/javascript" id="jetpack-blocks-assets-base-url-js-before">
/* <![CDATA[ */
var Jetpack_Block_Assets_Base_Url="https://circulatingnow.nlm.nih.gov/wp-content/plugins/jetpack/_inc/blocks/";
/* ]]> */
</script>
<script type="text/javascript" id="google-translate-init-js-extra">
/* <![CDATA[ */
var _wp_google_translate_widget = {"lang":"en_US","layout":"0"};
/* ]]> */
</script>
<script type='text/javascript' src='https://circulatingnow.nlm.nih.gov/_static/??-eJyNj8EKwjAQRH/IdCtC1YP4KdIm27DtNgndTYN/b9DeRPA4w7wZpiRDwXJ2KDAJOBKFDYOLK5RkUuTnSMzNQqGZ5FAtG4NiUEicPYUKoabezvCoNTBwtLOA5EHsSkkp1sRGWH7A/UyyoH7gXZhxfafcX4OZ2EEh51EFfIye0ejaB+Fe8cvYf9yX2/F8ul7aru0uLzfvYWU='></script>
<!-- Google Translate element loader. An explicit https: scheme replaces the protocol-relative URL. -->
<script type="text/javascript" src="https://translate.google.com/translate_a/element.js?cb=googleTranslateElementInit&amp;ver=14.4" id="google-translate-js"></script>
<script type="text/javascript" id="sharing-js-js-extra">
/* <![CDATA[ */
var sharing_js_options = {"lang":"en","counts":"1","is_stats_active":"1"};
/* ]]> */
</script>
<script type="text/javascript" src="https://circulatingnow.nlm.nih.gov/wp-content/plugins/jetpack/_inc/build/sharedaddy/sharing.min.js?ver=14.4" id="sharing-js-js"></script>
<script type="text/javascript" id="sharing-js-js-after">
/* <![CDATA[ */
// Handle to the most recently opened sharing popup (shared by the sharing handlers in this script).
var windowOpen;
( function () {
	/**
	 * Cross-browser Element.matches().
	 *
	 * @param {Element} el  Element to test.
	 * @param {string}  sel CSS selector.
	 * @return {boolean} True when `el` matches `sel`.
	 */
	function matches( el, sel ) {
		return !! (
			el.matches && el.matches( sel ) ||
			el.msMatchesSelector && el.msMatchesSelector( sel )
		);
	}

	// Delegated click handler: open Twitter share links in a small popup window.
	document.body.addEventListener( 'click', function ( event ) {
		if ( ! event.target ) {
			return;
		}

		// Accept a click on the link itself or on one of its direct children.
		var el;
		if ( matches( event.target, 'a.share-twitter' ) ) {
			el = event.target;
		} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-twitter' ) ) {
			el = event.target.parentNode;
		}

		if ( el ) {
			event.preventDefault();

			// If there's another sharing window open, close it.
			// window.open() returns null when the popup is blocked, and
			// typeof null is 'object', so test truthiness rather than
			// typeof to avoid calling close() on null.
			if ( windowOpen ) {
				windowOpen.close();
			}
			windowOpen = window.open( el.getAttribute( 'href' ), 'wpcomtwitter', 'menubar=1,resizable=1,width=600,height=350' );
		}
	} );
} )();
var windowOpen;
( function () {
function matches( el, sel ) {
return !! (
el.matches && el.matches( sel ) ||
el.msMatchesSelector && el.msMatchesSelector( sel )
);
}
document.body.addEventListener( 'click', function ( event ) {
if ( ! event.target ) {
return;
}
var el;
if ( matches( event.target, 'a.share-facebook' ) ) {
el = event.target;
} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-facebook' ) ) {
el = event.target.parentNode;
}
if ( el ) {
event.preventDefault();
// If there's another sharing window open, close it.
if ( typeof windowOpen !== 'undefined' ) {
windowOpen.close();
}
windowOpen = window.open( el.getAttribute( 'href' ), 'wpcomfacebook', 'menubar=1,resizable=1,width=600,height=400' );
return false;
}
} );
} )();
var windowOpen;
( function () {
function matches( el, sel ) {
return !! (
el.matches && el.matches( sel ) ||
el.msMatchesSelector && el.msMatchesSelector( sel )
);
}
document.body.addEventListener( 'click', function ( event ) {
if ( ! event.target ) {
return;
}
var el;
if ( matches( event.target, 'a.share-tumblr' ) ) {
el = event.target;
} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-tumblr' ) ) {
el = event.target.parentNode;
}
if ( el ) {
event.preventDefault();
// If there's another sharing window open, close it.
if ( typeof windowOpen !== 'undefined' ) {
windowOpen.close();
}
windowOpen = window.open( el.getAttribute( 'href' ), 'wpcomtumblr', 'menubar=1,resizable=1,width=450,height=450' );
return false;
}
} );
} )();
var windowOpen;
( function () {
function matches( el, sel ) {
return !! (
el.matches && el.matches( sel ) ||
el.msMatchesSelector && el.msMatchesSelector( sel )
);
}
document.body.addEventListener( 'click', function ( event ) {
if ( ! event.target ) {
return;
}
var el;
if ( matches( event.target, 'a.share-linkedin' ) ) {
el = event.target;
} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-linkedin' ) ) {
el = event.target.parentNode;
}
if ( el ) {
event.preventDefault();
// If there's another sharing window open, close it.
if ( typeof windowOpen !== 'undefined' ) {
windowOpen.close();
}
windowOpen = window.open( el.getAttribute( 'href' ), 'wpcomlinkedin', 'menubar=1,resizable=1,width=580,height=450' );
return false;
}
} );
} )();
var windowOpen;
( function () {
function matches( el, sel ) {
return !! (
el.matches && el.matches( sel ) ||
el.msMatchesSelector && el.msMatchesSelector( sel )
);
}
document.body.addEventListener( 'click', function ( event ) {
if ( ! event.target ) {
return;
}
var el;
if ( matches( event.target, 'a.share-pocket' ) ) {
el = event.target;
} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-pocket' ) ) {
el = event.target.parentNode;
}
if ( el ) {
event.preventDefault();
// If there's another sharing window open, close it.
if ( typeof windowOpen !== 'undefined' ) {
windowOpen.close();
}
windowOpen = window.open( el.getAttribute( 'href' ), 'wpcompocket', 'menubar=1,resizable=1,width=450,height=450' );
return false;
}
} );
} )();
var windowOpen;
( function () {
function matches( el, sel ) {
return !! (
el.matches && el.matches( sel ) ||
el.msMatchesSelector && el.msMatchesSelector( sel )
);
}
document.body.addEventListener( 'click', function ( event ) {
if ( ! event.target ) {
return;
}
var el;
if ( matches( event.target, 'a.share-telegram' ) ) {
el = event.target;
} else if ( event.target.parentNode && matches( event.target.parentNode, 'a.share-telegram' ) ) {
el = event.target.parentNode;
}
if ( el ) {
event.preventDefault();
// If there's another sharing window open, close it.
if ( typeof windowOpen !== 'undefined' ) {
windowOpen.close();
}
windowOpen = window.open( el.getAttribute( 'href' ), 'wpcomtelegram', 'menubar=1,resizable=1,width=450,height=450' );
return false;
}
} );
} )();
/* ]]> */
</script>
<!-- Hidden (display:none) iframe that loads the widgets.wp.com likes master page. A title is supplied so the frame has an accessible name. -->
<iframe src="https://widgets.wp.com/likes/master.html?ver=20250305#ver=20250305" title="Likes master frame" scrolling="no" id="likes-master" name="likes-master" style="display:none;"></iframe>
<!-- Dialog container for the likes avatar list: starts aria-hidden, is focusable only from script (tabindex -1), and carries a literal "%d" placeholder. NOTE(review): presumably filled in and revealed by Jetpack's likes script — confirm. Inner markup stays on one line so no whitespace text nodes are introduced. -->
<div id="likes-other-gravatars" role="dialog" aria-hidden="true" tabindex="-1"><div class="likes-text"><span>%d</span></div><ul class="wpl-avatars sd-like-gravatars"></ul></div>
<script type="text/javascript">
(function () {
	// The remote comment form iframe, or null when this page has none.
	const commentFrame = document.getElementById( 'jetpack_remote_comment' );

	/**
	 * Points the comment iframe at the comment being replied to by setting
	 * (or, for a falsy value, removing) the `replytocom` query parameter on
	 * its src. The src is only reassigned when the URL actually changes, so
	 * the frame is not reloaded needlessly.
	 *
	 * Only called once commentFrame is known to exist.
	 */
	function tellFrameNewParent( commentParentValue ) {
		const url = new URL( commentFrame.src );
		if ( commentParentValue ) {
			url.searchParams.set( 'replytocom', commentParentValue );
		} else {
			url.searchParams.delete( 'replytocom' );
		}
		if ( commentFrame.src !== url.href ) {
			commentFrame.src = url.href;
		}
	}

	/**
	 * Wraps the global addComment.moveForm so that moving the reply form also
	 * updates the iframe's `replytocom` parameter. Safe to call repeatedly:
	 * it does nothing until addComment exists, and nothing after patching.
	 */
	const watchReply = function () {
		// Without the iframe there is nothing to keep in sync; leave the core
		// function untouched rather than wrapping it in a call that would
		// throw on `commentFrame.src` and block the original moveForm.
		if ( ! commentFrame ) {
			return;
		}
		// Check addComment._Jetpack_moveForm to make sure we don't monkey-patch twice.
		if ( 'undefined' === typeof addComment || addComment._Jetpack_moveForm ) {
			return;
		}
		// Cache the Core function.
		addComment._Jetpack_moveForm = addComment.moveForm;

		// Cancelling a reply clears `replytocom` again. The link may be absent,
		// so only attach the listener when it exists.
		const cancel = document.getElementById( 'cancel-comment-reply-link' );
		if ( cancel ) {
			cancel.addEventListener( 'click', function () {
				tellFrameNewParent( false );
			} );
		}

		addComment.moveForm = function ( _, parentId ) {
			tellFrameNewParent( parentId );
			return addComment._Jetpack_moveForm.apply( null, arguments );
		};
	};

	document.addEventListener( 'DOMContentLoaded', watchReply );
	// In WP 6.4+, the script is loaded asynchronously, so we need to wait for it to load before we monkey-patch the functions it introduces.
	document.querySelector( '#comment-reply-js' )?.addEventListener( 'load', watchReply );

	// Live collection of every remote comment iframe on the page.
	const commentIframes = document.getElementsByClassName( 'jetpack_remote_comment' );

	// Resize the matching comment iframe when it reports its height.
	window.addEventListener( 'message', function ( event ) {
		// Only accept messages posted from the Jetpack comment form origin.
		if ( event.origin !== 'https://jetpack.wordpress.com' ) {
			return;
		}
		// Ignore messages that carry neither an iframe id nor a height.
		if ( ! event?.data?.iframeUniqueId && ! event?.data?.height ) {
			return;
		}
		const eventDataUniqueId = event.data.iframeUniqueId;
		// Change height for the matching comment iframe
		for ( let i = 0; i < commentIframes.length; i++ ) {
			const candidate = commentIframes[ i ];
			const candidateUrl = new URL( candidate.src );
			const iframeUniqueIdParam = candidateUrl.searchParams.get( 'iframe_unique_id' );
			// Loose equality is kept on purpose: the parameter is a string (or
			// null) while the posted id may be another type or missing.
			if ( iframeUniqueIdParam == eventDataUniqueId ) {
				candidate.style.height = event.data.height + 'px';
				return;
			}
		}
	} );
})();
</script>
</body>
</html>