nih-gov/www.nlm.nih.gov/pubs/techbull/nd21/nd21_medline_2022.html
2025-02-26 13:17:41 -05:00

187 lines
13 KiB
HTML

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">
<head>
<meta http-equiv="X-UA-Compatible" content="IE=8;" />
<meta name="twitter:card" content="summary_large_image" />
<meta name="twitter:site" content="@NLM_NIH" />
<meta name="twitter:title" content="MEDLINE 2022 Initiative: Transition to Automated Indexing. NLM Technical Bulletin. 2021 Nov&#8211;Dec" />
<meta name="twitter:description" content="The NLM Technical Bulletin is your source to stay informed about NLM products and services." />
<meta name="twitter:image" content="https://www.nlm.nih.gov/pubs/techbull/images/nlm_tech_bulletin_graphic_twitter.jpg" />
<meta property="og:url" content="https://www.nlm.nih.gov/pubs/techbull/tb.html" />
<meta property="og:type" content="article" />
<meta property="og:title" content="MEDLINE 2022 Initiative: Transition to Automated Indexing. NLM Technical Bulletin. 2021 Nov&#8211;Dec" />
<meta property="og:description" content="The NLM Technical Bulletin is your source to stay informed about NLM products and services." />
<meta property="og:image" content="https://www.nlm.nih.gov/pubs/techbull/images/nlm_tech_bulletin_graphic_facebook.jpg" />
<link type="text/css" href="/pubs/techbull/styles/reset.css" rel="stylesheet" />
<link type="text/css" href="/pubs/techbull/styles/technicalBulletin.css" rel="stylesheet" />
<!--Call jQuery-->
<script src="//assets.nlm.nih.gov/jquery/jquery-latest.min.js"></script>
<script src="//assets.nlm.nih.gov/jquery/jquery-migrate-latest.min.js"></script>
<script src="/pubs/techbull/scripts/techbull.js" type="text/javascript" language="javascript"></script>
<!--[if lte IE 8]>
<script type="text/javascript" src="/scripts/PIE.js"></script>
<![endif]-->
<link type="text/css" href="/pubs/techbull/styles/print.css" rel="stylesheet" media="print"/>
<title>MEDLINE 2022 Initiative: Transition to Automated Indexing. NLM Technical Bulletin. 2021 Nov&#8211;Dec</title>
<link rel="schema.DC" href="http://purl.org/dc/elements/1.1/" title="The Dublin Core metadata Element Set" />
<meta name="DC.Title" content="MEDLINE 2022 Initiative: Transition to Automated Indexing" />
<meta name="DC.Publisher" content="U.S. National Library of Medicine" />
<meta name="DC.Date.Issued" content="2021-12-01" />
<meta name="DC.Date.Modified" content="2024-03-14" />
<meta name="NLMDC.Date.LastReviewed" content="2024-03-14" />
<meta name="NLM.Contact.Email" content="nlmtechbull@mail.nlm.nih.gov" />
<meta name="DC.Type" content="Newsletters" />
<meta name="NLM.Permanence.Level" content="Permanent: Stable Content" />
<meta name="DC.Rights" content="Public Domain" />
<meta name="DC.Language" content="eng" />
<!-- Google Tag Manager -->
<script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start': new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0],j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-MT6MLL');</script>
<!-- End Google Tag Manager -->
</head>
<body>
<!-- Google Tag Manager -->
<noscript><iframe src="//www.googletagmanager.com/ns.html?id=GTM-MT6MLL" height="0" width="0" style="display:none;visibility:hidden" title="googletagmanager"></iframe></noscript>
<!-- End Google Tag Manager -->
<div class="skipnavigation"><a title="Skip the navigation on this page" href="#skipnav" class="skipnavigation">Skip Navigation Bar</a></div>
<div>
<div class="header">
<img src="/pubs/techbull/images/tb_logo_113.jpg" alt="National Library of Medicine Technical Bulletin" title="National Library of Medicine Technical Bulletin" /><img src="/pubs/techbull/images/nlm_masthead_113.jpg" alt="National Library of Medicine Technical Bulletin" title="National Library of Medicine Technical Bulletin" usemap="#nlm_masthead_113" />
</div>
<!-- Site search form: sends the "query" text box and the hidden "v:project" field (value "technical-bulletin") by GET to the vsearch.nlm.nih.gov endpoint. -->
<div class="search_box">
<form method="get" action="//vsearch.nlm.nih.gov/vivisimo/cgi-bin/query-meta" target="_self" name="searchForm" class="searchForm">
<label class="displaynone" for="search">Search</label>
<!-- Clear only the default prompt text on focus, so a query the user has already typed is not wiped when the field regains focus. -->
<input name="query" id="search" type="text" class="search-input inactive" size="50" onfocus="if (this.value === this.defaultValue) { this.value = ''; }" value="Search here for NLM Technical Bulletin articles" aria-label="Search NLM Technical Bulletin" />
<input type="hidden" name="v:project" value="technical-bulletin" />
</form>
</div>
</div>
<!-- Top navigation list for the Technical Bulletin. The separator images carry an empty alt because they are purely decorative. -->
<div id="nav">
<!--Open drop-->
<ul class="topnav">
<li class="currentissue"><a href="//www.nlm.nih.gov/pubs/techbull/current_issue.html">Current Issue</a> <img class="separator" src="/pubs/techbull/images/whitelinetransparentbackground.gif" alt=""/></li>
<li class="archive"><a href="//www.nlm.nih.gov/pubs/techbull/back_issues.html">Previous Issues</a> <img class="separator" src="/pubs/techbull/images/whitelinetransparentbackground.gif" alt=""/></li>
<li class="about"><a href="//www.nlm.nih.gov/pubs/techbull/about.html">About</a> <img class="separator" src="/pubs/techbull/images/whitelinetransparentbackground.gif" alt=""/></li>
<li class="staycurrent"><a href="//www.nlm.nih.gov/pubs/techbull/stay_current.html">Stay Current <img class="emaillogo" src="/pubs/techbull/images/email_20px.gif" alt="E-Mail Sign Up" style="margin-top: -4px;"/> <img class="rsslogo" src="/pubs/techbull/images/rss_20px.gif" alt="RSS Feed" style="margin-top: -4px;"/></a></li>
</ul>
<!--Close drop-->
</div>
<div class="body">
<a id="skipnav" name="skipnav"></a>
<div class="syndicate">
<p class="tableOfContents"><strong>Table of Contents: <a href="/pubs/techbull/nd21/nd21_issue_cover.html">2021 NOVEMBER&#8211;DECEMBER No. 443</a></strong></p>
<p class="prevnext"><span class="buttons">
<span class="previous"><a href="nd21_fda_srs.html">Previous</a></span> <span class="next"><a href="nd21_clinical_trials_beta.html">Next</a></span>
</span></p>
<hr class="hr1" />
<h1 class="articleH1">MEDLINE 2022 Initiative: Transition to Automated Indexing</h1>
<p class="tbyearmonth">MEDLINE 2022 Initiative: Transition to Automated Indexing. NLM Tech Bull. 2021 Nov-Dec;(443):e5.</p>
<div class="articleactions">2021 December 01 <span class="status">[posted]</span>
</div>
<div class="articleParagraph">
<p>As part of the efforts of the National Library of Medicine (NLM) to transform and accelerate biomedical discovery and improve health and health care, we are transitioning to automated <a href="https://www.nlm.nih.gov/mesh/meshhome.html">MeSH</a> indexing of <a href="https://www.nlm.nih.gov/medline/medline_overview.html">MEDLINE</a> citations in <a href="https://pubmed.ncbi.nlm.nih.gov/">PubMed</a>. Automated indexing will provide users with timely access to MeSH indexed metadata and allow NLM to scale MeSH indexing for MEDLINE to the volume of published biomedical literature. Human indexers have been and will continue to be involved in the refinement of automated indexing algorithms and will play a significant role in the quality assurance approaches for automated indexing.</p>
<p>In 2018, NLM launched the MEDLINE 2022 initiative, a five-year development plan that aims to ensure that MEDLINE continues to evolve to meet the needs of users in an age of data-driven discovery. A key goal of this initiative involved implementing a range of indexing methods to ensure the timely assignment of MeSH to MEDLINE citations. Based on the successful pilot of automated indexing on a limited scale since 2016, it was determined that fully automated MEDLINE indexing be implemented with quality control, and that human curation and automation be specifically applied to improve the discoverability of chemical and gene information in MEDLINE.</p>
<div class="figure"><br />
<img src="/pubs/techbull/nd21/graphics/medline_2022_fig1.png" alt="Three different images of computer keyboards captioned with the Medline 2022 Initiative Goals. 1. A 24-hour response time for MeSH indexed citations to appear in PubMed; 2. Expanded chemical and gene curation by subject matter experts; 3. Continuous improvement of the automatic indexing algorithm" title="MEDLINE 2022 Initiative Goals." /><br />
<strong>Figure 1: MEDLINE 2022 Initiative Goals.</strong></div>
<a name="fig1"></a>
<p>Automated MeSH indexing has been under development at NLM for many years and the most significant outcome is the development of the <a href="https://lhncbc.nlm.nih.gov/ii/tools/MTI.html#:~:text=NLM%20Medical%20Text%20Indexer%20%28MTI%29%20The%20NLM%20Medical,more%20efficiently%20and%20consistently.%20Batch%20MTI%20Interactive%20MTI">Medical Text Indexer</a> (MTI) by researchers in the <a href="https://lhncbc.nlm.nih.gov/">Lister Hill National Center for Biomedical Communications</a>. MTI is not new; it has been used to provide indexing suggestions for human indexers since 2002 and was incorporated as the "first line" of indexing with subsequent human curation for a set of journals starting in 2011. Automated indexing with a version of MTI has been used for comments since 2016, OLDMEDLINE citations since 2015, and for processing an experimental batch of backlogged citations in 2016. Since 2018, the method of indexing has been identified in the XML of all completed citations.</p>
<p>The MTI algorithm has been undergoing refinements in recent years as we move towards automation, including incorporation of deep learning approaches to improve the application of MeSH subheadings, the incorporation of rules and triggers for the indexing of Publication Types, and the application of IM designation. The version of MTI used for current automated indexing is called MTIA, and it is being applied to citations from a variety of journals. Human curation of MTIA-indexed citations originally involved a scan of all citations indexed by MTIA but has been modified to focus curation on specific sets of citations (e.g., those involving genes and proteins) to scale curation and to ensure that indexed terms are correct and irrelevant terms are not indexed.</p>
<p>Recognizing that chemicals and genes are some of the most searched data points in PubMed, we are working to improve recognition of these entities by MTIA and are evaluating the incorporation of chemicals identified by the <a href="https://www.nature.com/articles/s41597-021-00875-1">NLM-Chem</a> identification tool. We are also evaluating <a href="https://www.sciencedirect.com/science/article/pii/S1532046421001088">NLM-Gene</a> as a tool to support curation at scale for the creation of GeneRIFs (the links made between PubMed and the <a href="https://www.ncbi.nlm.nih.gov/gene?cmd=Retrieve">Gene</a> database).</p>
<p>By mid-2022 we expect that all citations indexed for MEDLINE will be indexed by MTIA, with human curation applied as indicated. Beyond achievement of this major milestone, the MTIA algorithm will continue to be refined and improved.</p>
<p>Watch for future <i>NLM Technical Bulletin</i> articles for updates on developments. If you have questions or suggestions, please contact <a href="https://support.nlm.nih.gov/support/create-case/">NLM Customer Support</a>.</p>
</div>
<p class="articleParagraph">
</p>
</div>
<!-- Page footer: ISSN and reuse statement, NLM address, policy and agency links, and the last-updated date. -->
<div class="footer">
<p class="footerLeft"><span class="footerissn"><strong>ISSN 2161-2986 (Online)</strong> Content not copyrighted; freely reproducible.</span><br/>
<a href="/">National Library of Medicine</a> 8600 Rockville Pike, Bethesda, MD 20894
<br/>
<a href="//www.nlm.nih.gov/socialmedia/index.html">Connect with NLM</a>,
<a href="//www.nlm.nih.gov/web_policies.html">Web Policies</a>,
<a href="//www.nlm.nih.gov/careers/jobopenings.html">Careers</a>,
<a href="//www.nlm.nih.gov/accessibility.html">Accessibility</a>,
<a href="//www.usa.gov/" id="anch_34">USA.gov</a>,
<a href="//www.hhs.gov/vulnerability-disclosure-policy/index.html">HHS Vulnerability Disclosure</a>
<br/>
<a href="//www.nih.gov/">NIH</a>,
<a href="https://www.hhs.gov/">HHS</a>,
<a href="//www.nih.gov/institutes-nih/nih-office-director/office-communications-public-liaison/freedom-information-act-office">FOIA</a>,
<!-- Opens in a new tab; rel="noopener" keeps the opened page from reaching back to this one through window.opener. -->
<a class="supportLink" href="//support.nlm.nih.gov?from=" target="_blank" rel="noopener">NLM Support Center</a>
</p>
<p class="footerRight">
<strong>Last updated:</strong> 14 March 2024</p>
</div>
</div>
<!-- Image map for the masthead image that declares usemap="#nlm_masthead_113": three rectangular link regions, each with matching alt and title text. -->
<map id="nlm_masthead_113" name="nlm_masthead_113">
<area shape="rect" alt="NLM Technical Bulletin" coords="1,15,396,45" href="//www.nlm.nih.gov/pubs/techbull/tb.html" title="NLM Technical Bulletin" />
<area shape="rect" alt="National Library of Medicine" coords="0,47,203,62" href="//www.nlm.nih.gov/" title="National Library of Medicine" />
<area shape="rect" coords="207,47,396,62" href="//www.nih.gov/" alt="National Institutes of Health" title="National Institutes of Health" />
</map>
<!--*****************************Content end*******************************-->
<script src="/scripts/support.js"></script>
<script src="/core/nlm-notifyExternal/1.0/nlm-notifyExternal.min.js"></script>
</body>
</html>