nih-gov/www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html
2025-02-26 13:17:41 -05:00

5104 lines
360 KiB
HTML

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<link href="/archive/styles/global.css" rel="stylesheet" title="default" type="text/css" />
<link href="/archive/styles/global_import.css" rel="stylesheet" media="all" title="default" type="text/css" />
<script type="text/javascript" src="/archive/scripts/archive.js"></script>
<style type="text/css" media="screen" title="default">
@import url("/archive/styles/global_import.css");
@import url("/archive/styles/level2_import.css");
SPAN.disclaimer{
text-align: right; font-style:italic;
}
</style>
<!--[if IE]>
<link rel="stylesheet" href="/archive/styles/global_print.css" type="text/css" title="printpreview" media="print" />
<link rel="stylesheet" href="/archive/styles/level2_print.css" type="text/css" title="printpreview" media="print" />
<![endif]-->
<style type="text/css" media="print" >
#screen-version{display:none;}
</style>
<link rel="stylesheet" href="/archive/styles/archive.css" type="text/css" title="default" />
<title>Unified Medical Language System (UMLS) (CBM 96-8)</title>
<meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1" /><link
title="The Dublin Core metadata Element Set"
"http://purl.org/dc/elements/1.1/"="http://purl.org/dc/elements/1.1/"" rel="schema.DC" /><!-- encoding = ISO-8859-1 -->
<META NAME="DC.Title" content="Current Bibliographies in Medicine 96-8">
<META NAME="DC.Publisher" content="U.S. National Library of Medicine" />
<META NAME="DC.Date.Issued" content="1997-03-21" />
<META NAME="DC.Date.Modified" content="1998-04-24" />
<META NAME="DC.Type" content="Bibliography">
<META NAME="DC.Rights" content="public domain" />
<META NAME="DC.Language" content="eng" />
<META NAME="NLMDC.Identifier.BibUI" content="9706954" />
<META NAME="NLMDC.Subject.NLMClass" content="ZW 1 N272 no.96-8" />
<META NAME="DC.Contributor.Creator" content="Selden, Catherine" />
<META NAME="DC.Relation.IsPartOf" content="Current bibliographies in medicine 96-8" />
<META NAME="NLMDC.Subject.Title" content="UMLS" />
<META NAME="DC.Subject.MeSH" content="Natural Language Processing" />
<META NAME="DC.Subject.MeSH" content="Vocabulary, Controlled" />
<META NAME="DC.Contributor" content="Humphreys, Betsy L." />
<META NAME="DC.Contributor" content="National Library of Medicine (U.S.). Reference Section." />
<META NAME="DC.Identifier.URL" content="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html" />
<META NAME="DC.Description.Notes" content="archived" />
<META NAME="DC.Date.Archived" content="2004-08-31" />
<META NAME="DC.Contact.Email" content="refweb@nlm.nih.gov" />
<META NAME="NLMDC.Date.Expiration" content="2003-04-30" />
<META NAME="NLM.Permanence.Level" content="Permanent: Stable Content" />
<META NAME="NLM.Permanence.Guarantor" content="U.S. National Library of Medicine" />
<META NAME="DC.Relation" content="Current Bibliographies in Medicine 96-8">
<META NAME="DC.Title.Alternate" content="CBM 96-8, Unified Medical Language System (UMLS)">
<META NAME="DC.Contributor" content="Catherine R. Selden, M.L.S.">
<META NAME="DC.Contributor" content="Betsy L. Humphreys, M.L.S.">
<META NAME="DC.Format" content="HTML">
<META NAME="DC.Coverage" content="January 1986 through December 1996">
<!-- BEGIN NLM HEADER -->
<meta content="MSHTML 6.00.2800.1458" name="GENERATOR" />
</head>
<body text=#000000 vLink=#960044 bgColor=#ffffff>
<!-- -->
<a href="#skip" style="color: red; display: none;">Skip to Content</a>
<table width="100%" border="0" cellpadding="0" cellspacing="0" id="archeader">
<tr>
<td id="arcbanner" ><img src="/archive/images/head_left.gif" alt="" width="334" height="55" border="0" usemap="#nlm_logo" id="NLMBanner" /></td>
<td valign="top" width="*"><div id="archivetext">Archives</div></td>
<td id="arcsearch"><form method="get" action="http://search.nlm.nih.gov/homepage/query" target="_self" name="searchForm" id="searchForm" >
<label for="PARAMETER" id="searchLabel">Search NLM Web Site</label>
<input name="PARAMETER" id="PARAMETER" type="text" class="text" size="12" />
<input name="imageField" type="image" src="/archive/images/button_go.gif" alt="Search" align="absmiddle" class="gobutton" />
<span class="navbar" ><a href="/">NLM Home</a> | <a href="/about/archives.html">About the Archives</a></span>
<input type="hidden" name="FUNCTION" value="search" />
<input type="hidden" name="MAX" value="250" />
<input type="hidden" name="DISAMBIGUATION" value="true" />
</form>
</td>
</tr>
<tr id="breadcrumb" >
<td colspan="3"><span id="arccontainerheader" class="breadlinks"><a href="/index.html">Home</a> &gt; <strong>NLM Archives</strong> &gt; </span> <span id="disclaimerheader"><strong>Document content is not current. Links may be broken.</strong></span><span class="spacer"></span></td>
</tr>
</table>
<p> </p>
<TABLE cellSpacing=0 cellPadding=0 width=640 border=0><!-- NLM LOGO BAR -->
<TBODY>
<TR>
<TD noWrap align=left><A title="Skip NLM Navigation"
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#skipNLMNav"><IMG
height=1 alt="Skip NLM Navigation" src="umlscbm_files/blank1.gif" width=1
border=0></A><A "http://www.nlm.nih.gov/nlmhome.html"><IMG height=60
alt="NLM Home Page" src="umlscbm_files/99subhead.gif" width=201
border=0></A><A "http://www.nlm.nih.gov/pubs/resources.html"><IMG
height=60 alt="Current Bibliographies in Medicine Home Page"
src="umlscbm_files/cbmhead.gif" width=428 border=0></A><BR><!-- FIRST NAVIGATION BAR (BLUE BAR) --><IMG height=1
alt="" src="umlscbm_files/blank1.gif" width=1 border=0><A
"http://www.nlm.nih.gov/pubs/resources.html"><IMG height=20
alt="CBM Home Page" src="umlscbm_files/cbmhm.gif" width=219
border=0></A><A "http://www.nlm.nih.gov/contacts/contact.html"><IMG
height=20 alt="Contact NLM" src="umlscbm_files/contactnlmblubar.gif"
width=99 border=0></A><A "http://www.nlm.nih.gov/siteindex.html"><IMG
height=20 alt="Site Index" src="umlscbm_files/siteindexblubar.gif"
width=81 border=0></A><A "http://www.nlm.nih.gov/search.html"><IMG
height=20 alt="Search Our Web Site" src="umlscbm_files/sowsblubar.gif"
width=151 border=0></A><A "http://www.nlm.nih.gov/nlmhome.html"><IMG
height=20 alt="NLM Home Page" src="umlscbm_files/nlmhomeblubar.gif"
width=90 border=0></A><BR><!-- SECOND NAVIGATION BAR --><IMG height=1
alt="" src="umlscbm_files/blank1.gif" width=1 border=0><A
"http://www.nlm.nih.gov/hinfo.html"><IMG height=20
alt="Health Information" src="umlscbm_files/hinavybar.gif" width=119
border=0></A><A "http://www.nlm.nih.gov/libserv.html"><IMG height=20
alt="Library Services" src="umlscbm_files/lsnavybar.gif" width=115
border=0></A><A "http://www.nlm.nih.gov/resprog.html"><IMG height=20
alt="Research Programs" src="umlscbm_files/rpnavybar.gif" width=134
border=0></A><A "http://www.nlm.nih.gov/nn.html"><IMG height=20
alt="New and Noteworthy" src="umlscbm_files/nnnavybar.gif" width=128
border=0></A><A "http://www.nlm.nih.gov/ginfo.html"><IMG height=20
alt="General Information" src="umlscbm_files/ginavybar.gif" width=130
border=0></A> </TD></TR>
<TR>
<TD><BR><!-- END NLM HEADER --><!-- Standard heading -->
<H2 id=skipNLMNav>Current Bibliographies in Medicine 96-8</H2><!-- ************************* Content start ************************* -->
<HR>
<H1><A name=list>Unified Medical Language System® (UMLS®)</A> </H1>
<HR>
<P>January 1986 through December 1996</P>
<P>280 Citations</P>
<P>Prepared by <BR>Catherine R. Selden, M.L.S.<BR>Betsy L. Humphreys,
M.L.S.<BR></P>
<P>U.S. DEPARTMENT OF HEALTH AND HUMAN SERVICES<BR>Public Health
Service<BR>National Institutes of Health</P>
<P><A "http://www.nlm.nih.gov/nlmhome.html">National Library of
Medicine</A><BR>Reference Section<BR>8600 Rockville Pike<BR>Bethesda,
Maryland 20894</P>
<P>1997</P>
<HR>
<P><STRONG>National Library of Medicine Cataloging in
Publication</STRONG></P>
<P>Selden, Catherine <BR>Unified Medical Language System (UMLS): January
1986 through December 1996 : 280 citations / prepared by Catherine R.
Selden, Betsy L. Humphreys. -- Bethesda, Md. (8600 Rockville Pike,
Bethesda 20894) : U.S. Dept. of Health and Human Services, Public Health
Service, National Institutes of Health, National Library of Medicine,
Reference Section ; Pittsburgh, PA : Sold by the Supt. of Docs., U.S.
G.P.O., 1997.<BR>-- (Current bibliographies in medicine ; 96-8)</P>
<P>1. Unified Medical Language System - bibliography 2. Vocabulary,
Controlled - bibliography 3. Natural Language Processing - bibliography I.
Humphreys, Betsy L. II. National Library of Medicine (U.S.). Reference
Section III. Title IV. Series</P>
<P>02NLM: ZW 1 N272 no. 96-8</P>
<HR>
<H2>Contents</H2>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#12">Series
Note</A></H3>
<H3><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#8">Foreword</A></H3>
<H3><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#10">Introduction</A></H3>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#18">Search
Strategy</A></H3>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#20">Sample
Citations</A></H3>
<H3><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Bibliography</A></H3><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A>
<HR>
<P><A name=12><STRONG>Series Note</STRONG></A></P>
<P>Current Bibliographies in Medicine (CBM) is a continuation in part of
the National Library of Medicine's Literature Search Series, which ceased
in 1987 with No. 87-15. In 1989 it also subsumed the Specialized
Bibliography Series. Each bibliography in the new series covers a distinct
subject area of biomedicine and is intended to fulfill a current awareness
function. Citations are usually derived from searching a variety of online
databases. Citations are usually derived from searching a variety of
online databases. <A
"http://www.nlm.nih.gov/pubs/factsheets/online_databases.html">NLM
databases</A> utilized include MEDLINE®, AVLINE®, BIOETHICSLINE®,
CANCERLIT®, CATLINE®, HEALTHSTAR<SUP><FONT size=1>tm</FONT></SUP>,
POPLINE<SUP><FONT size=1>tm</FONT></SUP> and TOXLINE®. The only criterion
for the inclusion of a particular published work is its relevance to the
topic being presented; the format, ownership, or location of the material
is not considered. </P>
<P>Comments and suggestions on this series may be addressed to:</P>
<P>Karen Patrias, Editor<BR>Current Bibliographies in
Medicine<BR>Reference Section<BR>National Library of Medicine<BR>Bethesda,
MD 20894<BR>Phone: 301-496-6097<BR>Fax: 301-402-1384<BR><A
"mailto:ref@nlm.nih.gov">mailto:ref@nlm.nih.gov</A></P>
<P>This bibliography, CBM 96-8, is the last publication in this series for
calendar year 1996.</P>
<P>Ordering Information:</P>
<P><EM>Current Bibliographies in Medicine</EM> is sold by the
Superintendent of Documents, U.S. Government Printing Office, P.O. 371954,
Pittsburgh, PA 15250-7954. Orders for individual bibliographies in the
series ($5.50, $6.88 foreign) should be sent to the Superintendent of
Documents citing the title, CBM number, and the GPO List ID number.</P>
<P>Internet Access:</P>
<P>The <EM>Current Bibliographies in Medicine</EM> series is also
available at no cost to anyone with Internet access through the Library's
World Wide Web site at <A
"http://www.nlm.nih.gov/pubs/resources.html">http://www.nlm.nih.gov/pubs/resources.html</A>.</P>
<P>Use of funds for printing this periodical has been approved by the
Director of the Office of Management and Budget through September 30,
1997.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<P><STRONG><A name=8>FOREWORD</A></STRONG> </P>
<P>This bibliography marks the tenth anniversary of the National Library
of Medicine's Unified Medical Language System® (UMLS®) project, a
long-term research and development effort with the ambitious goal of
enabling computer systems to "understand" medical meaning. The project was
proposed to Congress as essential to the development of advanced health
information systems -- and as requiring an initial 5-10 year development
phase which would cost $1-3 million per year. The Congress responded with
generous and faithful support. </P>
<P>In 1986, we foresaw a future with widespread access to more powerful,
less expensive computers, improved telecommunications, and a huge array of
diverse machine-readable biomedical information sources. In such a future,
health professionals and researchers would be able to obtain information
relevant to practice or research decisions when and where needed -- but
only if automated systems could interpret their inquiries correctly,
identify databases likely to have information relevant to these inquiries,
and retrieve the pertinent information from those sources. The UMLS
project set out to design and build Knowledge Sources that could be used
by computer programs to overcome the barriers to effective information
retrieval caused by disparities in language and by the scattering of
information across many databases and systems. We understood from the
beginning that designing and building the Knowledge Sources would in fact
be easier and less expensive than maintaining them over time in order to
reflect new biomedical discoveries and concepts. For this reason, an
institution like NLM was considered to be more appropriate for directing
the UMLS project than a university department operating under short-term
grant support. </P>
<P>Ten years later our predictions regarding computers, communications,
and biomedical databases have proven to be roughly accurate, and the
explosive growth of the Internet and the World-Wide Web has both
simplified and magnified the problems the UMLS is designed to address. NLM
has issued annual editions of the UMLS Knowledge Sources since 1990 and,
in 1996, sent them to more than 700 system developers around the world.
Use of the UMLS Knowledge Sources allows many different computer systems,
including NLM's own Internet Grateful Med, to behave as if they had at
least a limited understanding of the medical meaning in words and phrases
used by questioners. Interest in controlling the language used in
computer-based patient records, as an aid to decision support, quality
control, and research, has spread from the medical informatics community
to those delivering and paying for health care. In this environment, there
is increasing interest in applying the UMLS products. </P>
<P>A long-term project of the breadth and complexity of the UMLS requires
a team with knowledge and skills from many fields. From its inception, the
UMLS effort has involved internal research and development by NLM staff,
competitively awarded contracts and grants for research assistance from
many U.S. informatics research groups, and volunteer UMLS users worldwide,
who have tested the Knowledge Sources in different environments and
provided valuable suggestions for their improvement. The UMLS project is
also indebted to the producers of many important biomedical vocabularies
and classifications who provided their terminologies to NLM for
incorporation in the UMLS Metathesaurus. </P>
<P>Set out below are the research groups and principal investigators who
have been NLM's major partners in developing and testing the UMLS
Knowledge Sources:</P>
<UL>
<LI>Beth Israel Hospital, Charles Safran, M.D.<BR>
<LI>Brigham &amp; Women's Hospital, Robert A. Greenes, M.D., Ph.D.
<LI>Carnegie-Mellon University, David A. Evans, Ph.D.
<LI>Columbia University, James J. Cimino, M.D.
<LI>Indiana University, Clement J. McDonald, M.D.
<LI>Kaiser Permanente, Simon Cohn, M.D., M.P.H.
<LI>Lexical Technology, Inc., Mark S. Tuttle
<LI>Massachusetts General Hospital, G. Octo Barnett, M.D.
<LI>Mayo Foundation, Christopher G. Chute, M.D., Ph.D.
<LI>Oregon Health Sciences University, William R. Hersh, M.D.
<LI>University of California, San Francisco, Marsden S. Blois, M.D.,
Ph.D.
<LI>University of Pittsburgh, Randolph A. Miller, M.D., Gregory F.
Cooper, M.D., Ph.D., Henry J. Lowe, M.D.
<LI>University of Utah, Homer R. Warner, M.D., Ph.D.
<LI>Yale School of Medicine, Perry L. Miller, M.D., Ph.D. </LI></UL>
<P>Literally dozens of individuals from these and other institutions have
made substantial contributions to the UMLS project. We thank them all for
what has been a gratifying and productive association. </P>
<P>The UMLS has benefited from the talent, energy, and insight of many
leaders in medical informatics and medical librarianship, most of whom are
well-represented in this bibliography. One scientist whose number of UMLS
publications does not adequately reflect his importance to the project is
Marsden Scott Blois, M.D., Ph.D. Dr. Blois was awarded one of the first
UMLS research contracts in 1986; he died in 1988 just after the project's
exploratory phase concluded. His seminal thinking about medical
information [1,2] greatly influenced the UMLS project and the design of
the UMLS Metathesaurus. His NLM colleagues and friends believe that, like
us, he would have been pleased -- but not satisfied -- with the UMLS
achievements of the past decade. </P>
<P>Donald A.B. Lindberg, M.D.<BR>Director, National Library of
Medicine<BR></P>
<P>Betsy L. Humphreys, M.L.S.<BR>Assistant Director for Health Services
Research Information, National Library of Medicine <BR></P>
<P><CITE>1. Blois MS. Information and medicine: the nature of medical
descriptions. Berkeley: University of California Press;
1984.</CITE><BR><CITE>2. Blois MS. Medicine and the nature of vertical
reasoning. N Engl J Med 1988 Mar 31;318(13):847-51.</CITE> </P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A><BR>
<HR>
<P><STRONG><A name=10>INTRODUCTION</A></STRONG></P>
<P>Unified Medical Language System</P>
<P>In 1986, the National Library of Medicine (NLM) began a long-term
research and development project to build the Unified Medical Language
System (UMLS®). The purpose of the UMLS is to aid the development of
systems that help health professionals and researchers retrieve and
integrate electronic biomedical information from a variety of sources. The
UMLS approach involves the development of machine-readable Knowledge
Sources that can be used by a wide variety of applications programs to
compensate for differences in the way concepts are expressed in different
machine-readable sources and by different users, to identify the
information sources most relevant to a user inquiry, and to negotiate the
telecommunications and search procedures necessary to retrieve information
from these sources. The goal is to make it easy for users to link
disparate information systems, including computer-based patient records,
bibliographic databases, factual databases, and expert systems. </P>
<P>The UMLS project is directed by a multi-disciplinary team of NLM staff
and involves medical informatics research groups across the United States
working under competitively awarded contracts and grants. More than 700
volunteer users receive the annual editions of the UMLS products free of
charge under the terms of a license agreement. The Knowledge Sources are
iteratively refined and expanded based on feedback from those applying
each successive version. </P>
<P>There are four UMLS Knowledge Sources: the Metathesaurus®:, the
SPECIALIST<SUP><FONT size=1>tm</FONT></SUP> Lexicon, a Semantic Network
and an Information Sources Map. Most heavily used to date, the
Metathesaurus provides a uniform, integrated distribution format for more
than 30 biomedical vocabularies and classifications, linking many
different names for the same concepts. The Lexicon contains syntactic
information for many Metathesaurus terms, component words, and English
words, including verbs, that do not appear in the Metathesaurus. The
Semantic Network contains information about the types or categories (e.g.,
"Disease or Syndrome," "Virus") to which all Metathesaurus concepts have
been assigned and the permissible relationships among these types (e.g.,
"Virus" causes "Disease or Syndrome"). The Information Sources Map or
directory contains both human-readable and machine-"processable"
information about the scope, location, vocabulary, syntax rules, and
access conditions of biomedical databases of all kinds. The references in
this bibliography cover the structure and semantics of the UMLS Knowledge
Sources, their development and maintenance, and assessments of their
coverage and utility for particular purposes. Some of this literature
reflects understandable confusion about the relationship of the
Metathesaurus to its constituent vocabularies. </P>
<P>The UMLS Knowledge Sources were designed as multi-purpose tools, to
facilitate the development of more effective biomedical information
systems. As intended, they have been applied in a wide variety of research
and development environments to many different tasks, including vocabulary
development, knowledge representation, clinical data capture, linking
patient data to knowledge sources, curriculum analysis, natural language
processing, automated indexing, and information retrieval. This
bibliography covers the full range of UMLS applications. </P>
<P>Particularly in its early years, but also more recently, the UMLS
project commissioned exploratory and ancillary studies on such topics as
user information needs, methods of organizing and merging vocabulary
information, and information retrieval techniques and also developed
specialized tools for use in the research effort. The bibliography also
includes published articles describing these efforts. </P>
<P>NLM staff members and outside observers have viewed the UMLS project as
an important complement to other initiatives affecting access to
information and information technology, including Integrated Advanced
Information Management Systems (IAIMS), the High Performance Computing and
Communications Program, and the emerging National Information
Infrastructure. Some commentators have been critical of the UMLS's purpose
and its approach. The bibliography includes discussions of the
relationship of the UMLS to other programs as well as commentaries on its
potential value. </P>
<P>The references in this bibliography include journal articles, book
chapters, technical reports, dissertations, and conference papers that
include substantive discussions of the UMLS project, the UMLS Knowledge
Sources, UMLS applications, and related studies carried out under the
auspices of the UMLS project. In general, meeting abstracts, letters,
comments, and editorials are included only if they present research
findings or express opinions about the project not reflected elsewhere.
Although both English and foreign language publications are cited, most
references are to English language publications. References are arranged
by subject and appear under only one topic. Abstracts have been included
if permission was granted by copyright holders. Special copyright notices
appear at the end of the abstracts if requested by copyright holders. </P>
<P>The compilers wish to thank Marlyn Schepartz, National Library of
Medicine, for her expert production and editorial assistance; Alexa T.
McCray, Ph.D. for help in organizing the references; and the many UMLS
researchers who reviewed an early draft of the bibliography and provided
additional relevant references. </P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<P><A name=18><STRONG>Search Strategy</STRONG></A></P>
<P>A variety of online databases are usually searched in preparing
bibliographies in the CBM series. To assist you in updating or otherwise
manipulating the material in this search, the strategy used for the NLM's
MEDLINE database is given below. Please note that the search strategies
presented here differ from individual demand searches in that they a re
generally broadly formulated and irrelevant citations edited out prior to
printing.</P>
<P>SS1 = UNIFIED MEDICAL LANGUAGE SYSTEM OR VOCABULARY, CONTROLLED
OR<BR>NATURAL LANGUAGE PROCESSING<BR>SS2 = (TW) UNIFIED AND MEDICAL AND
LANGUAGE AND SYSTEM OR UMLS<BR>SS3 = (TW) NATURAL AND LANGUAGE AND
PROCESSING OR METATHESAURUS<BR>SS4 = SEMANTIC@NETWORK<BR>SS5 =
KNOWLEDGE@SOURCES#<BR>SS6 = INFORMATION@SOURCES@MAP<BR>SS7 = 1 OR 2 OR 3
OR 4 OR 5 OR 6 <BR></P>
<P><STRONG>GRATEFUL MED and INTERNET GRATEFUL MED</STRONG></P>
<P>To make online searching easier and more efficient, the Library offers
GRATEFUL MED, microcomputer-based software that provides a user-friendly
interface to most NLM databases. This software was specifically developed
for health professionals and features multiple choice menus and "fill in
the blank" screens for easy search preparation. GRATEFUL MED runs on an
IBM PC (or IBM-compatible) with DOS 2.0 or Windows or on a Macintosh, and
requires a Hayes (or Hayes-compatible) modem. It may be purchased from the
National Technical Information Service in Springfield, Virginia, for
$29.95 (plus $3.00 per order for shipping). For your convenience, an order
blank has been enclosed at the back of this bibliography.</P>
<P>INTERNET GRATEFUL MED is available from the World Wide Web. The user
with Internet access and an NLM user account need only point a compatible
Web browser (Netscape Navigator is strongly recommended) to <A
"http://igm.nlm.nih.gov/">http://igm.nlm.nih.gov/</A>. No other
software at the user end is required.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<P><STRONG><A name=20>Sample Citations</A></STRONG> </P>
<P>Citations are formatted according to the rules established for
<EM>Index Medicus</EM> ®. Sample journal and monograph citations appear
below. For journal articles written in a foreign language, the English
translation of the title is placed in brackets; for monographs, the title
is given in the original language. In both cases the language of
publication is shown by a three letter abbreviation appearing at the end
of the citation.</P>
<P><STRONG>Journal Article:</STRONG></P>
<P><EM>Example:</EM><BR>Cimino JJ. Use of the Unified Medical Language
System in patient care at the Columbia-Presbyterian Medical Center.
Methods Inf Med 1995 Mar;34(1-2):158-64. </P>
<P><EM>Order, with separating punctuation:</EM><BR>Authors. Article Title.
Abbreviated Journal Title Date;Volume(Issue):Pages.</P>
<P><STRONG>Book Chapter:</STRONG></P>
<P><EM>Example:</EM><BR>McCray AT. Representing biomedical knowledge in
the UMLS semantic network. In: Broering NC, editor. High-performance
medical libraries: advances in information management for the virtual era.
Westport (CT): Meckler; 1993. p. 31-44. </P>
<P><EM>Order, with separating punctuation:</EM><BR>Chapter Authors.
Chapter Title. Book Editor. Book Title. Place of Publication: Publisher;
Date. Pages.</P>
<P>For details of the formats used for references, see the following
publication:<BR>Patrias, Karen. <EM>National Library of Medicine
recommended formats for bibliographic citation</EM>. Bethesda (MD): The
Library; 1991 Apr. Available from: NTIS, Springfield, VA; PB91-182030.
</P><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to
title page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H2><A name=15>TABLE OF CONTENTS FOR UMLS CBM</A></H2>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#1">Overview and
Conceptual Foundations</A></H3>
<H3>UMLS Knowledge Sources</H3>
<UL>
<LI>Metathesaurus and Semantic Network<BR>
<UL>
<LI><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#2a">-Structural and
Semantic Properties</A><BR>
<LI><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#2b">-Development
and Maintenance</A><BR>
<LI>-<A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#2c">Content
Coverage</A><BR></LI></UL>
<LI><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#2d">Information
Sources Map</A><BR>
<LI><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#2e">Distribution
Formats and Associated Tools</A><BR></LI></UL>
<H3>UMLS Applications</H3>
<UL>
<LI>Vocabulary Construction and Concept Discovery<BR>
<UL>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3a">-
Vocabulary Design, Construction, and Maintenance</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3b">-
Vocabulary Standards, Servers, and Mapping Methods</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3c">-
Knowledge Acquisition and Concept Discovery</A><BR></LI></UL>
<LI>Data Creation<BR>
<UL>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3d">-
Clinical Data</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3e">-
Curricula and Faculty Interests</A><BR></LI></UL>
<LI>Natural Language processing, Indexing, and Retrieval<BR>
<UL>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3f">- NLP
Methods and Algorithms</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3g">-
Indexing and Retrieval Methods and Algorithms</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3h">-
Information Retrieval Systems</A><BR></LI></UL>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3i">Linking
Clinical Systems to Knowledge-Based Information Sources</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#3j">Access to
Multiple Knowledge-Based Information Sources</A><BR></LI></UL>
<H3>Preliminary and Ancillary Studies</H3><BR>
<UL>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4a">User
Information Needs</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4b">Vocabulary
Analysis and Merging</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4c">Knowledge
Acquisition and Representation</A><BR>
<LI><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4d">Information and
Retrieval Techniques</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4e">Vocabulary
Browsers</A><BR>
<LI><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#4f">Research
Tools</A><BR></LI></UL>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#5">The UMLS in
Relation to Other Programs</A></H3>
<H3><A href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#6">Commentaries
and Opinions about UMLS</A></H3><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A>
<HR>
<H3><A name=1>Overview and Conceptual Foundations</A></H3>
<HR>
<P>Hattery M. UMLS: guide and translator in the land of medical research.
Inf Retr Libr Autom (US) 1992 Feb;27(9):1-6.</P>
<P>Humphreys BL, Lindberg DA. Building the Unified Medical Language
System. Proc Annu Symp Comput Appl Med Care 1989:475-80. The National
Library of Medicine's Unified Medical Language System (UMLS) project has
moved from a period of background studies and exploration of alternatives
to the actual construction of the first versions of important UMLS
components. This paper discusses the UMLS development strategy and
assumptions, describes briefly the UMLS components as currently
envisioned, and then focuses on the content of the first version of the
UMLS metathesaurus (Meta-1), its central vocabulary component. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Humphreys BL, Lindberg DA. The UMLS project: making the conceptual
connection between users and the information they need. Bull Med Libr
Assoc 1993 Apr;81(2):170-7. Conceptual connections between users and
information sources depend on an accurate representation of the content of
available information sources, an accurate representation of specific user
information needs, and the ability to match the two. Establishing such
connections is a principal function of medical librarians. The goal of the
National Library of Medicine's Unified Medical Language System (UMLS)
project is to facilitate the development of conceptual connections between
users and relevant machine-readable information. The UMLS model involves a
combination of three centrally developed Knowledge Sources (a
Metathesaurus, a Semantic Network, and an Information Sources Map) and a
variety of smart interface programs that make use of these Knowledge
Sources to help users in different environments find machine-readable
information relevant to their particular practice or research problems.
The third experimental edition of the UMLS Knowledge Sources was issued in
the fall of 1992. Current priorities for the UMLS project include
developing applications that make use of the Knowledge Sources and using
feedback from these applications to guide ongoing enhancement and
expansion of the Knowledge Sources. Medical librarians are involved
heavily in the direction of the UMLS project, in the development of the
Knowledge Sources, and in their experimental application. The involvement
of librarians in reviewing, testing, and providing feedback on UMLS
products will increase the likelihood that the UMLS project will achieve
its goal of improving access to machine-readable biomedical information.
Copyright by and reprinted with permission of the Medical Library
Association.</P>
<P>Humphreys BL, Lindberg DA. The Unified Medical Language System project:
a distributed experiment in improving access to biomedical information.
Medinfo 1992;7(Pt 2):1496-500. The goal of the US National Library of
Medicine's UMLS project is to overcome the barriers to information access
caused by the variety of ways the same biomedical concepts are expressed
and by the fragmentation of useful biomedical information among disparate
databases and systems. The UMLS strategy focuses on the development of new
knowledge sources that can be used by a variety of intelligent programs to
compensate for differences in the terminology employed by users and
information sources and in database structure and content. The early
versions of the UMLS Knowledge Sources are intended for use by system
developers. They are available free of charge under the terms of an
experimental agreement and have been distributed to 150 sites throughout
the world. Priorities for annual enhancement to the UMLS components will
be based on feedback received from those who are applying these new tools
to a variety of information access problems.</P>
<P>Humphreys BL, Lindberg DA, Hole WT. Assessing and enhancing the value
of the UMLS Knowledge Sources. Proc Annu Symp Comput Appl Med Care
1991:78-82. The goal of the UMLS Project is to give practitioners and
researchers easy access to machine-readable information from diverse
sources. Assessment of the first experimental versions of the UMLS
Knowledge Sources is essential to measuring progress toward that goal and
to identifying needed enhancements. As of July 30, 1991, copies of the
first edition of the UMLS Knowledge Sources had been distributed to 143
individuals and institutions; 66 had provided initial feedback
information. The information received indicates that the UMLS Knowledge
Sources will undergo broad testing in the patient care, medical education,
library service, and product development environments. Preliminary data
support the hypothesis that expanded coverage of routine clinical concepts
is needed. Key enhancements planned for 1992 and beyond include expanded
coverage of ICD-9-CM and CPT. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Humphreys BL, Schuyler PL. The Unified medical language system: Moving
beyond the vocabulary of bibliographic retrieval. In: Broering NC.,
editor. High-performance medical libraries: advances in information
management for the virtual era. Westport (CT): Meckler; 1993. p. 31-44.
The National Library of Medicine's (NLM) Medical Subject Headings (MeSH)
is an extensive biomedical thesaurus used to index, catalog, and retrieve
citations to the biomedical literature. It is one of a number of source
vocabular ies for the Unified Medical Language System (UMLS), a major NLM
research and development program designed to help users to retrieve and
integrate information from a variety of disparate information sources. The
information sources of interest include bibl iographic databases, patient
records systems, factual databanks, and knowledge bases. The UMLS project
has produced three new Knowledge Sources: a Metathesaurus of concepts and
terms from vocabularies and classifications used in different types of
biomedi cal information sources: a Semantic Network of sensible
relationships among the broad semantic types or categories to which all
Metathesaurus concepts are assigned; and an information Sources Map that
describes the scope, content, and access conditions fo r publicly
available biomedical information sources. The UMLS Knowledge Sources are
intended for use by system developers and can be accessed by a variety of
interface programs to interpret user inquiries, identify sources of
information relevant to these queries, and retrieve the relevant
information. A number of specific projects are underway to assess the
usefulness of the current versions of the UMLS Knowledge Sources and to
provide feedback that can guide their future development.</P>
<P>Lindberg DA, Humphreys BL. Computer systems that understand medical
meaning. In: Scherrer JR, Cote RA, Mandil SH, editors, Computerized
natural medical language processing for knowledge representation.
Proceedings of the IFIP-IMIA WG6 International Wo rking Conference; 1988
Sep 12-15; Geneva, Switzerland. Amsterdam: North-Holland; 1989. p. 5-17.
The National Library of Medicine has begun the development of the Unified
Medical Language System (UMLS). The UMLS project is an effort to build an
increasing ly intelligent automated system that understands biomedical
terms and their interrelationships and uses this understanding to help
users retrieve and organize information from machine-readable sources.
Compared to many other efforts to build systems that understand medical
meaning, the UMLS emphasizes breadth of scope, even at the sacrifice of
depth of understanding. To some degree, it must attempt to encompass all
of biomedicine and to provide access to many different types of automated
information. This great breadth is partially offset by the defined and, in
a sense, limited purpose of the UMLS project. The goal of the UMLS is to
facilitate the retrieval and integration of information from a variety of
machine-readable information sources, including de scriptions of the
biomedical literature, clinical records, factual databanks and medical
knowledge bases. The UMLS will compensate for the differences in the
terminologies used in these disparate systems and for variations in the
language employed by user s themselves. </P>
<P>Lindberg DA, Humphreys BL. Toward a unified medical language. In: EFMI
- European Federation for Medical Informatics. Medical Informatics Europe
'87. Proceedings of the 7th International Congress; 1987 Sep 21-25; Rome,
Italy. Rome: Luigi Pozzi; 1987 . p. 23-31.</P>
<P>Lindberg DA, Humphreys BL. The UMLS knowledge sources: tools for
building better user interfaces. Proc Annu Symp Comput Appl Med Care
1990:121-5. The current focus of the National Library of Medicine's
Unified Medical Language System (UMLS) project is the development,
testing, and evaluation of the first versions of three new knowledge
sources: the Metathesaurus, the Semantic Network, and the Information
Sources Map. These three knowledge sources can be used by interface
programs to conduct an intellig ent interaction with the user and to make
the conceptual link between the user's question and relevant machine
readable information. NLM is providing experimental copies of the initial
versions of the UMLS knowledge sources in exchange for feedback on way s
they can and should be improved. The hope is that the results of such
experimentation will provide both immediate improvements in biomedical
information service and useful suggestions for enhancements to the UMLS.
Copyright by and reprinted with permiss ion of the American Medical
Informatics Association.</P>
<P>Lindberg DA, Humphreys BL, McCray AT. The Unified Medical Language
System. Methods Inf Med 1993 Aug;32(4):281-91. In 1986, the National
Library of Medicine began a long-term research and development project to
build the Unified Medical Language System (UMLS). The purpose of the UMLS
is to improve the ability of computer programs to understand the
biomedical meaning in user inquiries and to use this understanding to
retrieve and integrate relevant machine-readable information for users.
Underlying the U MLS effort is the assumption that timely access to
accurate and up-to-date information will improve decision making and
ultimately the quality of patient care and research. The development of
the UMLS is a distributed national experiment with a strong ele ment of
international collaboration. The general strategy is to develop UMLS
components through a series of successive approximations of the
capabilities ultimately desired. Three experimental Knowledge Sources, the
Metathesaurus, the Semantic Network, an d the Information Sources Map have
been developed and are distributed annually to interested researchers,
many of whom have tested and evaluated them in a range of applications.
The UMLS project and current developments in high-speed, high-capacity
intern ational networks are converging in ways that have great potential
for enhancing access to biomedical information.</P>
<P>Paterson G. UMLS knowledge sources and Canada: an overview. Bibl Medica
Can 1996 Spring;17(3):102-4.</P>
<P>Schuyler P. Integrated access to medical and pharmacological
information: the unified medical language system at the National Library
of Medicine. In: Proceedings: 1990 International Chemical Information
Conference; Montreux, Switzerland: New York: Springer-Verlag; 1990. p.
195-203.</P>
<P>Squires SJ. Access to biomedical information: the unified medical
language system. Libr Trends 1993 Summer;42(1):127-52. The National
Library of Medicine (NLM) is engaged in a long-term project to develop a
Unified Medical Language System (UMLS) that will retrieve and integrate
information from a variety of information resources. Two UMLS components
use fundamental aspects of controlled vocabulary structure and management
and their relationship to information retrieval that have general interest
for librarianship. The UMLS project is described, along with its initial
deployment in retrieval environments. Reprinted with permission from
Library Trends. Copyright 1993 The Board of Trustees of the University of
Illinois.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H3>UMLS Knowledge Sources</H3>
<UL>
<LI><STRONG>Metathesaurus and Semantic Network</STRONG><BR>
<UL>
<LI><STRONG><A name=2a>Structural and Semantic
Properties</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Joubert M, Miton F, Fieschi M, Robert JJ. A conceptual graphs modeling
of UMLS components. Medinfo 1995;8(Pt 1):90-4. The Unified Medical
Language System (UMLS) of the U.S. National Library of Medicine is a
complex collection of terms, concepts, and relationships derived from
standard classifications. Potential applications would benefit from a high
level representation of its components. This paper proposes a conceptual
representation of both the Metathesaurus and the Semantic Network of the
UMLS based on conceptual graphs. It shows that the addition of a
dictionary of concepts to the UMLS knowledge base allows the capability to
exploit it pertinently. This dictionary defines more precisely the core
concepts and adds constraints on their use. Constraints are dedicated to
guide an intelligent browsing of the UMLS knowledge sources.</P>
<P>Lipow SS, Campbell KE, Olson NE, Tuttle MS, Erlbaum MS, Fuller LF,
Sherertz DS, Nelson SJ, Cole WG. Formal properties of the metathesaurus:
An update. Proc Annu Symp Comput Appl Med Care 1995:944.</P>
<P>McCray AT. Representing biomedical knowledge in the UMLS semantic
network. In: Broering NC., editor. High-performance medical libraries:
advances in information management for the virtual era. Westport (CT):
Meckler; 1993. p. 45-55. The Unified Medical Language System (UMLS)
Semantic Network is one of three Knowledge Sources currently available as
part of the National Library of Medicine's (NLM) UMLS Project. The purpose
of the Network is to provide a consistent categorization of all concepts
found in the Metathesaurus and to provide useful links between these
concepts at the level of the semantic types. The Semantic Network is
closely tied to the other two UMLS Knowledge Sources, the Metathesaurus
and the Information Sources Map. Taken together, these three Knowledge
Sources provide powerful tools for enhancing biomedical information
retrieval.</P>
<P>McCray AT. UMLS semantic network. Proc Annu Symp Comput Appl Med Care
1989:503-7. The UMLS network of semantic types is one component of NLM's
evolving Unified Medical Language System. This paper discusses the role of
the semantic network in the overall system, then describes the evolution
and current status of the network, and finally, concludes with a
discussion of plans for further development. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>McCray AT, Hole WT. The scope and structure of the first version of the
UMLS Semantic Network. Proc Annu Symp Comput Appl Med Care 1990:126-30.
The authors discuss the UMLS Semantic Network, one of three UMLS knowledge
sources currently under development by the National Library of Medicine.
They describe the structure and content of the network, and discuss the
relationship between the network and the first version of the UMLS
Metathesaurus. They address the assumptions and process involved in
assigning semantic types to Metathesaurus concepts and conclude with a
description of the distribution format of this knowledge source. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P>
<P>McCray AT, Nelson SJ. The representation of meaning in the UMLS.
Methods Inf Med 1995 Mar;34(1-2):193-201. The UMLS knowledge sources
provide detailed information about biomedical naming systems and
databases. The Metathesaurus contains biomedical terminology from an
increasing number of biomedical thesauri, and the Semantic Network
provides a structure that encompasses and unifies the thesauri that are
included in the Metathesaurus. This paper addresses some fundamental
principles underlying the design and development of the Metathesaurus and
Semantic Network. It begins with a description of the formal properties of
the semantic network. It continues with consideration of the principle of
semantic locality and how this is reflected in the UMLS knowledge sources.
The paper concludes with a discussion of the issues involved in attempting
to reuse knowledge and the potential for reuse of the UMLS knowledge
sources.</P>
<P>Nelson SJ, Fuller LF, Erlbaum MS, Tuttle MS, Sherertz DD, Olson NE. The
semantic structure of the UMLS Metathesaurus. Proc Annu Symp Comput Appl
Med Care 1992:649-53. Meta-1.1, the UMLS metathesaurus, represents medical
knowledge in the forms of names of concepts and links between those
concepts. The representations of the semantic neighborhood of a concept
can be thought of as dimensions of the property of semantic locality and
include term information (broader, narrower, or otherwise related), the co
ntextual information (parent-child, siblings in a hierarchy), the semantic
types, and the co-occurrence data (links discovered empirically from
concepts used to index the medical literature.) The degree of redundancy
of each of these dimensions was invest igated by reviewing the extent of
multiple presentations of concepts which appear as related to a given
concept. The degree of overlap was surprisingly small. While the
co-occurrence data finds some of the links represented by other
dimensions, those link s are but minute fractions of the vast amount of
co-occurrence derived links. Because parent-child relationships are often
subsumptive (or categorical) in nature, it might be expected that siblings
usually share the same semantic types. While true in the aggregate, the
wide variance in percent of types shared may reflect the intended usages
of the source vocabularies. Noun phrases were extracted from the
definitions of 40 concepts in Meta-1 in order to assess systematically the
coverage of important conce pts by Meta-1, and to assess whether the links
between these definitional concepts, which may have special value, and the
concept being defined were indeed present. Out of 161 of these
definitional concepts, 29 were not represented in Meta-1, and 37 of th ose
represented in Meta-1 had no direct link to the concept they were
defining. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Nelson SJ, Tuttle MS, Cole WG, Sherertz DD, Sperzel WD, Erlbaum MS,
Fuller LL, Olson NE. From meaning to term: semantic locality in the UMLS
Metathesaurus. Proc Annu Symp Comput Appl Med Care 1991:209-13. The
Unified Medical Language System Metathesaurus represents the results of a
synthesis of existing biomedical naming systems (thesauri). The naming and
other information about the meanings in the Metathesaurus can be used to
find the preferred naming of that meaning in the source chosen by the
user, by exploiting the property of semantic locality. The aspects of
semantic locality in the Metathesaurus which can be thus exploited are the
terms, the semantic types, the use of that term in a source context, and
the co-occurrence of terms in MEDLINE. To find how a meaning is named in
the source of choice, a user must exploit one of these aspects of semantic
locality, entering a term somehow related to the term being sought, and
navigating to the preferred term. While the first three of these aspects
of semantic locality are normative, the last is empirical. Testing of the
utility of the aspects of semantic locality in information retrieval would
require a uniform interface with 1, no Metathesaurus, 2, the Metathesaurus
without the aspects in question, and 3, the Metathesaurus including all
the aspects. Other potential uses of empirically derived semantic locality
include defining or suggesting potentially relevant concepts in a given
situation. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Schuyler PL, Hole WT, Tuttle MS, Sherertz DD. The UMLS Metathesaurus:
representing different views of biomedical concepts. Bull Med Libr Assoc
1993 Apr;81(2):217-22. The UMLS Metathesaurus is a compilation of names,
relationships, and associated information from a variety of biomedical
naming systems representing different views of biomedical practice or
research. The Metathesaurus is organized by meaning, and the fundamental
unit in the Metathesaurus is the concept. Differing names for a biomedical
meaning are linked in a single Metathesaurus concept. Extensive additional
information describing semantic characteristics, occurrence in
machine-readable information sources, and how concepts co-occur in these
sources is also provided, enabling a greater comprehension of the concept
in its various contexts. The Metathesaurus is not a standardized
vocabulary; it is a tool for maximizing the usefulness of existing
vocabularies. It serves as a knowledge source for developers of biomedical
information applications and as a powerful resource for biomedical
information specialists. Copyright by and reprinted with permission of the
Medical Library Association.</P>
<P>Tuttle M, Sherertz D, Olson N, Erlbaum M, Sperzel D, Fuller L, Nelson
S. Using Meta-1-the 1st version of the UMLS Metathesaurus. Proc Annu Symp
Comput Appl Med Care 1990:131-5. The National Library of Medicine (NLM) is
developing the Unified Medical Language System (UMLS) to provide uniform
access to the world's biomedical knowledge. The foundation of the UMLS is
a metathesaurus of concept names, or terms. Meta-1, the first version of
the Metathesaurus, was synthesized from existing biomedical nomenclatures
and classification systems, and it contains in excess of 100000 terms,
including all those from MeSH and DSM, and a portion of those from SNOMED,
ICD, CPT, LCSH, COSTAR and other sources. These names are arranged and
labeled so as to help answer the questions, 'What is it called?' and
'Where can I find out more about it?' The first question is referred to as
the naming problem, and the second as the location problem.' Meta-1 is a
source of lexical diversity and semantic locality with which to address
these problems in biomedicine. While the NLM will be using Meta-1 in the
UMLS, non-NLM developers and users may wish to use Meta-1 to help solve
their own naming and location problems. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Tuttle MS, Nelson SJ, Fuller LF, Sherertz DD, Erlbaum MS, Sperzel WD,
Olson NE, Suarez-Munist ON. The semantic foundations of the UMLS
metathesaurus. Medinfo 1992;7(Pt 2):1506-11. The United States National
Library of Medicine (NLM) has issued two (annual) versions of the Unified
Medical Language System (UMLS) Metathesaurus, with the third scheduled for
Fall, 1992. The UMLS project is a long-term initiative intended to
develop, for use by both care-givers and researchers, a uniform interface
to biomedical knowledge available in electronic form. The project has been
in a component evaluation phase since the release of Meta-1.0, the first
version of the Metathesaurus, and an accompanying Semantic Network, in
October, 1990. The Metathesaurus, so called because it is a synthesis and
enhancement of existing naming and classification systems, is the central
naming component of the UMLS, a place where both users and programs can
retrieve the names of biomedical concepts, and information about how the
names and concepts relate to one another, and how they are used in
selected machine readable sources.</P>
<P>Tuttle MS, Olson NE, Campbell KE, Sherertz DD, Nelson SJ, Cole WG.
Formal properties of the Metathesaurus. Proc Annu Symp Comput Appl Med
Care 1994:145-9. The Metathesaurus is a machine-created, human edited and
enhanced synthesis of authoritative biomedical terminologies. Its formal
properties permit it to be a) exploited by computers, and b) modified and
enhanced without compromising that usage. If further constraints were
imposed on the existence and identity of Metathesaurus relationships,
i.e., if every Metathesaurus concept had a genus and a differentia, then
the Metathesaurus could be converted into an Aristotelian Hierarchy. In
this sense, a genus is a concept that classifies another concept, and a
differentia is a concept that distinguishes the classified concept from
all other concepts in the same class. Since, in principle, these
constraints would make the Metathesaurus easier to leverage and maintain
computationally, it is interesting to ask to what degree the maintenance
and enhancement procedures now in place are producing a Metathesaurus that
is also an Aristotelian Hierarchy. Given a liberal interpretation of the
current Metathesaurus schema, the proportion of the Metathesaurus that is
Aristotelian in each annual version is increasing in spite of dramatic
concurrent increases in the number of Metathesaurus concepts. Without
formality there is no modifiability nor scalability. We need formal
methods and computer-based tools that can help us with the task [of
controlled medical vocabulary construction]. We need research in which
controlled vocabulary development is the focus rather than a stepping
stone for work on other theories and applications. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Yang Y, Chute CG. A schematic analysis of the Unified Medical Language
System. Proc Annu Symp Comput Appl Med Care 1991:204-8. The UMLS is a
complex collection of medical terms and relationships derived from
standard classifications. Appreciating the scope and layout of these
relations from text descriptions of relational schema is difficult. The
graphical technique of Logical Data Structure (LDS) representation was
employed to illustrate the UMLS schema as a data abstraction, affording
additional insights that might otherwise escape notice. An LDS
representation of the Metathesaurus offers the following advantages: 1)
the separation of a viewpoint from physical data structures enables a
global outline of the contents; 2) the graphical map makes the
interrelation of data visible; and 3) the logical entities explicitly
reflect the decision-making which was implicit or ambiguous in the
relational scheme. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=2b>Development and
Maintenance</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Sherertz DD, Olson NE, Tuttle MS, Erlbaum MS. Source inversion and
matching in the UMLS Metathesaurus. Proc Annu Symp Comput Appl Med Care
1990:141-5. One of three knowledge sources being developed as NLM'S UMLS
is a biomedical thesaurus, called the Metathesaurus. It contains
inter-term relationships across six biomedical nomenclatures and
classification systems, derivable from lexical mapping techniques. The
first public version, META-1, was built in two stages: source inversion
and source matching. Versions for the six sources were obtained in
machine-readable form. Source specific techniques were derived empirically
to analyze the information structure and content of each source. The
results of each analysis were used to guide the inversion of the
corresponding source, resulting in a homogeneous representation for all
sources. The core concepts of META-1 come primarily from MEDLINE index
terms (MeSH). Previous work on lexical mapping developed algorithmic
methods to link concepts in different sources. These methods were refined
iteratively, and used to implement a META-1 matching engine. The initial
version of META-1 was constructed with this engine, by matching the META-1
core concepts to the other sources. This version of META-1 was edited and
enhanced by domain experts, after the inclusion of supplementary
information, to produce the first publicly released version of META-1.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Sherertz DD, Olson NE, Tuttle MS, Sperzel WD, Erlbaum MS, Fuller LF.
The META-1 engine: a database methodology used in building the UMLS
METATHESAURUS. Medinfo 1992;7(Pt 1):144-9. Three knowledge sources are
being developed as part of the US NLM's UMLS project. The largest of these
is a biomedical thesaurus, called the METATHESAURUS. META-1 and META-1.1
(or META-1*), the first two versions of the METATHESAURUS, contain term
attributes and relationships across a number of biomedical nomenclatures
and classification systems. Entries in META-1* result from human experts
editing entries computed by an explicit database methodology. A database
engine is implemented to manage the steps used to build up the entries of
META-1* before editing, and to control the application of facts generated
by editing the computed META-1* entries. This engine maintains and
manipulates a database of facts about the entries in META-1*, and, prior
to editing produces a METATHESAURUS that is probably correct, in the sense
that all of the inter-term relationships are derivable solely from data
within the sources. The methodology used by this engine controls the
management of complexity in the METATHESAURUS, as facts change and evolve,
allowing many iterations of META-1* to be computed and analyzed.</P>
<P>Sherertz DD, Tuttle MS, Blois MS, Erlbaum MS. Intervocabulary mapping
within the UMLS: the role of lexical matching. Proc Annu Symp Comput Appl
Med Care 1988:201-6. Within the NLM's UMLS Project, one challenge is
mapping concepts from one information resource to another. While a
complete solution to this problem requires construction of a comprehensive
biomedical thesaurus, the present research provides evidence that
considerable progress can be made with a straightforward lexical approach.
Furthermore, such a lexical approach is the only practical way to begin
construction of, and maintain, any such thesaurus. Related research has
demonstrated the regularity of word usage within the context of
biomedicine. This regularity suggests that mapping between biomedical
information resources that have a constrained vocabulary can use lexical
matching techniques with considerable success. A method has been developed
to map 'phrases' from candidate sources to MeSH. In one experiment, this
method attempts to map 834 disease names from the disease descriptions
composed at UCSF for the UMLS. In a second experiment, the same method
attempts to map disease attributes from these diseases. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Sherertz DD, Tuttle MS, Olson NE, Erlbaum MS, Nelson SJ. Lexical
mapping in the UMLS metathesaurus. Proc Annu Symp Comput Appl Med Care
1989:494-9. A critical knowledge source being developed as part of the
NLM's UMLS (National Library of Medicine's Unified Medical Language
System) project is a biomedical thesaurus, called the metathesaurus.
Central to the metathesaurus will be interterm relationships, across
several biomedical nomenclatures and classification systems, which are
derivable from lexical mapping techniques. Previous UMLS research on
intervocabulary mapping elaborated these techniques. During the Fall of
1988, they were extended and used to build Meta-0, a 2000-concept
demonstration metathesaurus. Meta-0 was composed primarily of the most
frequently occurring MEDLINE index terms from MeSH (Medical Subject
Headings), and MeSH will be the main source of concepts for Meta-1, the
initial public version of the metathesaurus. Review of Meta-0 suggested
several refinements to the methodology for building Meta-1. These include
labeling MeSH entry terms as lexical variants or synonyms before linking
them to other sources. Later work refined algorithmic methods that detect
lexical variants in MeSH. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Sperzel D, Erlbaum M, Fuller L, Sherertz D, Olson N, Schuyler P, Hole
W, Savage A, Passarelli P, Tuttle M. Editing the UMLS Metathesaurus:
review and enhancement of a computer knowledge source. Proc Annu Symp
Comput Appl Med Care (1990):136-40. The paper describes the editing of
Meta-1, the first official version of the National Library of Medicine's
(NLM) Unified Medical Language System (UMLS) Metathesaurus. After a
preliminary version of Meta-1 was generated by automated techniques, it
was edited by domain experts. The goal of editing was to enhance
approximately 30000 Metathesaurus entries and to correct 'errors of
commission' introduced by the automated techniques. Enhancements were made
by assigning semantic types (such as 'Disease or Syndrome' or 'Virus') and
lexical tags (such as 'eponym') to the Meta-1 entries. The production of
Meta-1 required balancing the costs of human and computational resources
appropriately, and it may illustrate a paradigm for the construction of
large biomedical information resources. The tool-supported process of
editing Meta-1, as well as some of the issues that arose during this
endeavor, are presented. Despite its large scale, the Meta-1 editing task
was accomplished within the specified constraints. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Sperzel WD, Tuttle MS. Updating the UMLS metathesaurus: A model. Proc
Annu Symp Comput Appl Med Care 1989:488-93. The Unified Medical Language
System (UMLS) is intended to support uniform access of machine-readable
biomedical information resources. The foundation of the UMLS is a
metathesaurus, which will link terms in different biomedical
nomenclatures. Because the resources and nomenclatures continue to evolve,
the metathesaurus must evolve with them. Thus, an important criterion for
the design of the metathesaurus is the accommodation of change. A model of
such accommodation is presented. A key design decision was the
representation of the metathesaurus, and prospective updates, as a
database of "facts." Particular emphasis is placed on database operations
that use the results of internomenclature lexical matching to collapse
entries from different nomenclatures into metathesaurus entries. The
implementation of this model for a simplified version of the metathesaurus
is described. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Sperzel WD, Tuttle MS, Olson NE, Erlbaum MS, Saurez-Munist O, Sherertz
DD, Fuller LF. The Meta-1.2 engine: a refined strategy for linking
biomedical vocabularies. Proc Annu Symp Comput Appl Med Care 1992:304-8.
This paper presents a preliminary description of the database schema and
associated procedures that are the foundation for the engine that will
produce Meta-1.2. Meta-1.2 is the next incarnation of the Metathesaurus,
which is one of the principal components of the National Library of
Medicine's Unified Medical Language System (UMLS). We use the word engine
as a generic term that includes a database and the programs that operate
on it. While this design builds heavily upon previous work, it
incorporates some major changes in philosophy. A major hypothesis is that
the simple representation described here is suitable for any controlled
vocabulary in the biomedical domain. Indeed, this hypothesis is central to
a strategy for producing future versions of the Metathesaurus and for
supporting collaboration with people who wish to contribute additional
terms and relationships to the Metathesaurus. Another change involves the
representation of classes and relationships. The revised database schema
includes an explicit representation of the source or authority for
relationships, which is analogous to the way that the sources of terms
have been represented since the first version of the Metathesaurus. A
sequence of steps utilizing the new representations to produce the
Metathesaurus is presented. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Suarez-Munist ON, Tuttle MS, Olson NE, Erlbaum MS, Sherertz DD, Lipow
SS, Cole WG, Keck KD, Davis AN, Hole WT, et al. MEME II supports the
cooperative management of terminology. Proc AMIA Fall Symp 1996:84-8.
Health care enterprises need enterprise-wide terminologies to compare,
reuse and repurpose health care descriptions. But once they are created,
these terminologies need to be maintained and enhanced to sustain their
utility and that of the descriptions encoded with them. MEME II
(Metathesaurus Enhancement and Maintenance Environment, Version II)
supports the required activities and enables enterprises to leverage their
investment in terminology and descriptions by permitting remote --
extra-enterprise -- enhancements to terminology to be incorporated
locally, and local -- intra-enterprise -- enhancements to be shared
remotely. MEME II represents all changes to terminologies as data, or
"actions" that can be interpreted by an "action engine." These actions, or
messages, represent semantic "units of work" that can be interpreted by
other copies of MEME II. The exchange of update messages increases the
likelihood that "the comparability of terminology-based health care
descriptions can be sustained. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Tuttle MS, Blois MS, Erlbaum MS, Sherertz DD, Nelson SJ. Toward a
bio-medical thesaurus: Building the foundation of the UMLS. Proc Annu Symp
Comput Appl Med Care 1988:191-5. The Unified Medical Language System
(UMLS) is being designed to provide a uniform user interface to
heterogeneous machine-readable biomedical information resources, such as
bibliographic databases, genetic databases, expert systems and patient
records. Such an interface will have to recognize different ways of saying
the same thing and provide links to related ways of saying things. One way
to represent the necessary associations is by using a domain thesaurus. As
no such thesaurus exists, and because, once built, it will be both sizable
and in need of continuous maintenance, its design should include a
methodology for building and maintaining it. A methodology utilizing
lexically expanded schema inversion and a design, called T. Lex, is
proposed, which forms an approach to the problem of defining and building
a biomedical thesaurus. It is argued that the semantic locality implicit
in such a thesaurus will support model-based reasoning in biomedicine.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Tuttle MS, Sherertz DD, Erlbaum MS, Olson NE, Nelson SJ. Implementing
meta-1: The first version of the UMLS metathesaurus. Proc Annu Symp Comput
Appl Med Care 1989:493-7. The Unified Medical Language System (UMLS) is
being designed to provide uniform access to computer-based resources in
biomedicine. For the foreseeable future, the foundation of the UMLS will
be a metathesaurus of concepts, synthesized from existing sources,
including MeSH, SNOMED, ICD-9-CM, CPT-4, DSM-III, and other biomedical
nomenclatures and classification systems. In Meta-1, the first version of
the metathesaurus, the synthesis is being implemented using a three-part
methodology: concept names (terms) and intrasource relationships, such as
synonymy, have been extracted from each source and converted to a
homogeneous representation, intersource lexical matches have been used to
combine terms from different sources into metathesaurus entries; and some
30000 of these entries, those containing MeSH terms and a selected sample
of terms from other domains, will be reviewed by humans, enhanced, and
modified, as appropriate. This methodology must eventually support
incremental development and an audit trail, and it must preserve
relationships added during human review. The 30,000 Meta-1 entries will
contain in excess of 60,000 biomedical terms, and these terms will
participate in more than 100,000 thesaurus relationships. These
"normative" relationships will be supplemented by "empirical"
relationships computed from certain UMLS resources. The first of the
empirical relationships will be counts of the occurrence and co-occurrence
of Meta-1 concepts in MEDLINE. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Tuttle MS, Sherertz DD, Erlbaum MS, Sperzel WD, Fuller LF, Olson NE,
Nelson SJ, Cimino JJ, Chute CG. Adding your terms and relationships to the
UMLS Metathesaurus. Proc Annu Symp Comput Appl Med Care 1991:219-23. The
National Library of Medicine's Unified Medical Language System
Metathesaurus contains the richest single corpus of biomedical names in
existence. Yet, developers wishing to make use of the Metathesaurus will
be confronted by users who want to add local terminology and relationships
not already represented there. We urge developers to fill those needs,
while, at the same time, they plan for the many consequences of unilateral
Metathesaurus enhancement. Foremost among these consequences is the need
to maintain local enhancements across subsequent releases of the
Metathesaurus. These problems are illustrated via examples of candidate
Metathesaurus enhancement terms in use at the Columbia-Presbyterian
Medical Center (CPMC), at the Mayo Clinic, and in Current Disease
Descriptions (CDD). Sharing and reuse of Metathesaurus enhancement methods
may permit local enhancements to be used at other sites, and it may permit
the global Metathesaurus utilization effort to benefit from economies of
scale. Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Tuttle MS, Suarez-Munist ON, Olson NE, Sherertz DD, Sperzel WD, Erlbaum
MS, Fuller LF, Hole WT, Nelson SJ, Cole WG, et al. Merging terminologies.
Medinfo 1995;8(Pt 1):162-6. A terminology is a systematic, authoritative
collection of concept names, or terms, in some domain. No single
terminology names all th0e important concepts in biomedicine. One approach
to creating a more comprehensive biomedical terminology is to merge
existing biomedical terminologies, as the UMLS Metathesaurus has done for
the last six years. Because existing terminologies may overlap--for
example, one terminology may name a concept also named by another
terminology--the terminologies in the Metathesaurus must be merged. Some
terminologies suggest merges through their structure or content e.g., they
suggest synonyms or connections to other terminologies; other merges can
be suggested by algorithm. Regardless, all merges in the Metathesaurus
must be approved by a human editor with appropriate domain knowledge. By
the time Meta-'96 is released early in 1996, one prototype and seven
released versions of the Metathesaurus will have been produced by a
sequence of four qualitatively different methods, named for the way in
which they merge terms: #1 Term Rewrite Rules, #2 Transitive Closure on
Facts, #3 Fact-at-a-Time Concept Merging, and #4 Action-at-a-Time Object
Processing. The development of each method has been constrained by the
annual Metathesaurus release schedule. The first two methods made the best
use of limited computational resources, and the last two make better use
of human editing resources.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=2c>Content
Coverage</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Bishop CW, Ewing PD. Transferring knowledge from one system to another.
Proc Annu Symp Comput Appl Med Care 1994:967. Although knowledge is
contained in many systems, moving it from one system to another is not an
easy task because each system is tailored in its own unique way and
because knowledge configurations are usually copyrighted. To populate our
FRAMEMED knowledge base we turned to the NLM Metathesaurus as a
readily-available open source of knowledge. We were disappointed by the
greatly variable granularity of the concepts and the lack of definitions
that could be borrowed. Some reference books in electronic form seem
attractive but reformatting will require excessive human intervention and
copyright negotiation. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Campbell JR, Kallenberg GA, Sherrick RC. The clinical utility of META:
an analysis for hypertension. Proc Annu Symp Comput Appl Med Care
1992:397-401. To evaluate the clinical completeness of the National
Library of Medicine Metathesaurus(META), we coded the conceptual
information found in 2000 problem oriented (SOAP) notes for hypertension
from one COSTAR site. To minimize the effects of practice idiosyncracy, we
analyzed an additional 500 notes from a second, geographically remote
site. Concepts occurring at either site numbered 1337. We classified
concepts occurring at both sites as core concepts and these numbered 121.
We attempted to find a matching concept of the proper semantic type in
META for each of the items. All matching was done by program with a manual
review by a physician. The overall success rate for matching was: [table:
see text]. We observed the greatest frequency of unmatched concepts in
physical examination, medications, symptoms, personal behavior,
non-medical therapies and counselling. We conclude that the current
release of META is not sufficiently rich to describe the process of care
in the ambulatory management of hypertension. However, the construction
and breadth of the current scheme holds promise for medical knowledge
representation and translation. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Campbell JR, Payne TH. A comparison of four schemes for codification of
problem lists. Proc Annu Symp Comput Appl Med Care 1994:201-5. We set out
to evaluate the completeness of four major coding schemes in
representation of the patient problem list: the Unified Medical Language
System (UMLS, 4th edition), the Systematized Nomenclature of Medicine
(SNOMED International), the Read coding system (version 2), and the
International Classification of Diseases (9th Clinical
Modification)(ICD-9-CM). We gathered 400 problems from patient records at
primary care sites in Omaha and Seattle. Matching these against the best
description found in each of the coding schemes, we asked five medical
faculty reviewers to rate the matches on a five-point Likert scale
assessing their satisfaction with the results. For the four schemes, we
computed the following rates of dissatisfaction, satisfaction, and average
scores: [table: see text]. From this analysis, we conclude that UMLS and
SNOMED performed substantially better in capturing the clinical content of
the problem lists than READ or ICD-9-CM. No scheme could be considered
comprehensive. Depending on the goal of systems developers, UMLS and
SNOMED may offer different, and complementary, advantages. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Chute CG, Cohn SP, Campbell KE, Oliver DE, Campbell JR. The content
coverage of clinical classifications. For The Computer-Based Patient
Record Institute's Work Group on Codes &amp; Structures. J Am Med Inform
Assoc 1996 May-Jun;3(3):224-33. BACKGROUND AND OBJECTIVE: Patient
conditions and events are the core of patient record content.
Computer-based records will require standard vocabularies to represent
these data consistently, thereby facilitating clinical decision support,
research, and efficient care delivery. To address whether existing major
coding systems can serve this function, the authors evaluated major
clinical classifications for their content coverage. METHODS: Clinical
text from four medical centers was sampled from inpatient and outpatient
settings. The resultant corpus of 14,247 words was parsed into 3,061
distinct concepts. These concepts were grouped into Diagnoses, Modifiers,
Findings, Treatments and Procedures, and Other. Each concept was coded
into ICD-9-CM, ICD-10, CPT, SNOMED III, Read V2, UMLS 1.3, and NANDA; a
secondary reviewer ensured consistency. While coding, the information was
scored: 0 = no match, 1 = fair match, 2 = complete match. RESULTS:
ICD-9-CM had an overall mean score of 0.77 out of 2; its highest subscore
was 1.61 for Diagnoses. ICD-10 scored 1.60 for Diagnoses, and 0.62
overall. The overall score of ICD-9-CM augmented by CPT was not materially
improved at 0.82. The SNOMED International system demonstrated the highest
score in every category, including Diagnoses (1.90), and had an overall
score of 1.74. CONCLUSION: No classification captured all concepts,
although SNOMED did notably the most complete job. The systems in major
use in the United States, ICD-9-CM and CPT, fail to capture substantial
clinical content. ICD-10 does not perform better than ICD-9-CM. The major
clinical classifications in use today incompletely cover the clinical
content of patient records; thus analytic conclusions that depend on these
systems may be suspect. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Chute CG, YangY, Tuttle MS, Sherertz DD, Olson NE, Erlbaum MS. A
preliminary evaluation of the UMLS Metathesaurus for patient record
classification. Proc Annu Symp Comput Appl Med Care 1990:161-5. The UMLS
project seeks to provide a unified interface to biomedical knowledge
resources. Patient medical records are an enormous repository of clinical
intervention and outcome, and are drawing increasing attention in the
pursuit of quality assurance, outcomes research, and epidemiologic
analysis. The authors sought to evaluate an unedited version of the
preliminary UMLS Metathesaurus, Meta-1, for the automated coding of
medical diagnosis and surgical procedures. Identical evaluations were
undertaken using SNOMED and the Mayo Clinic indexing lexicon. Meta-1
performed comparably to the comparison clinical indexing system, although
all systems exhibited problems associated with clinical attribute levels
and modifier combinations. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Cimino JJ. Representation of clinical laboratory terminology in the
Unified Medical Language System. Proc Annu Symp Comput Appl Med Care
1991:199-203. The Unified Medical Language System (UMLS) was examined to
determine its coverage of clinical laboratory terminology in use at the
Columbia-Presbyterian Medical Center (CPMC). The Metathesaurus (Meta-1)
contains exact matches for 30% of 1460 CPMC laboratory terms and near
matches for an additional 42%, with better coverage of atomic-level
concepts (substance terms) than complex ones (tests and panels). The
Semantic Network includes types for representing laboratory procedures
(2), measured substances (at least 56) and sampled substances (at least
14), but no type to represent specimens. Few of the UMLS semantic
relationships are applicable to the CPMC vocabulary. These results have
implications for the utility of the UMLS for linking clinical databases to
electronic medical information sources. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Evans DA. The language of medicine and the modeling of information. In:
Evans DA, Patel VL , editors. Advanced models of cognition for medical
training and practice; Berlin: Springer-Verlag; 1992. p. 43-67.</P>
<P>Friedman C. The UMLS coverage of clinical radiology. Proc Annu Symp
Comput Appl Med Care 1992:309-13. The informational content of clinical
radiology reports was examined to determine the coverage of the Unified
Medical Language System (UMLS) in relation to the terminology used by
physicians in the Radiology Department of Columbia Presbyterian Medical
Center (CPMC). The UMLS semantic network contained 17 semantic types which
were compatible with the types of clinical information in the reports. The
type of semantic categories missing from the UMLS consisted mainly of
modifier information relating to certainty, degree, and change type of
information. This type of information formed a substantial part of the
domain. Although most of the informational categories were found in the
UMLS semantic network, most of the domain terms were not. Our results
strongly suggest that the UMLS could be a significant tool for developing
clinical text processing applications if it were extended to cover
clinical domains. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Fuller L, Hole W, Olson N, Schuyler P, Tuttle M. Drug and chemical
entries in Meta-1. Proc Annu Symp Comput Appl Med Care 1990:146-50.
Thirty-two percent of the concepts in the National Library of Medicine's
UMLS Metathesaurus, Meta-1, are the names of biomedically important
chemicals. The paper describes the origin of the chemical terms included
in Meta-1, the structure and information content of these records, and the
potential uses of these concepts to access chemical information in
biomedical databases. Data is also presented quantitatively describing the
subjects of the articles in the biomedical literature and the frequency
with which articles include chemical subjects. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Huff SM, Warner HR. A comparison of Meta-1 and HELP terms: implications
for clinical data. Proc Annu Symp Comput Appl Med Care 1990:166-9. Terms
from the HELP System's vocabulary were matched with Meta-1 terms on a word
by word basis as well as on a phrase by phrase basis with the goal of
exploring what steps might need to be taken if some future version
(Meta-N) of the UMLS Metathesaurus were to be used to represent clinical
data. Word by word matching revealed that 54% of HELP words were present
in Meta-1, while 8% of HELP phrases had a corresponding phrase. The words
that did not match in HELP were mostly adjectives and adverbs after taking
into account misspellings and abbreviations. Phrase matches were low
because of the inclusion of adjectives and adverbs in HELP clinical terms.
If some future version of the Metathesaurus is to be used for
representation of clinical data additional terms are needed as well as a
grammar that permits construction of clinical phrases that include
modifiers and time references. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Lange LL. Representation of everyday clinical nursing language in UMLS
and SNOMED. Proc AMIA Fall Symp 1996:140-4. Everyday clinical nursing
language is informal and idiosyncratic. Whether the everyday language of
nurses can be represented by standardized vocabulary systems, such as the
UMLS and SNOMED, was the focus of the study. Computer systems that allow
clinicians to pick terms that are familiar are likely to be better
accepted and thus more effective than systems that impose formal
terminologies on users. Nursing phrases were extracted from handwritten
shift notes, reduced to atomic-level terms, and matched to UMLS and
SNOMED. Exact matches were obtained for 56% of terms in UMLS and 49% in
SNOMED. Fifty-nine semantic types and 24 different source vocabularies
were represented by the terms. Nursing vocabularies were represented by
only 5% of source vocabulary citations. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Lindberg CH. A comparison of the language of patient charts at
Presbyterian University Hospital, Pittsburgh, PA., and the Unified Medical
Language System of the National Library of Medicine (online medical
records) [dissertation]. Pittsburgh (PA): University of Pittsburgh; 1994.
176 p. Available from: University Microforms, Ann Arbor, MI; 9426718. This
dissertation matches the language of online medical records at the
Presbyterian University Hospital in Pittsburgh with the language of the
Unified Medical Language System (UMLS), an experimental thesaurus of
biomedicine developed by the National Library of Medicine. In the future,
the UMLS may serve as an interface between medical charts and the
information in databases such as Medline. The main research question is
whether the UMLS captures the concepts found in medical charts and can
thus be used to bridge the gap between chart terminology and MeSH, the
vocabulary used to access Medline. A sample of 50 records from two
diagnoses was compared to the UMLS. A statistical formula selected
potentially useful non-matches, which were then analyzed to determine
whether the missing concepts are wholly or partially present in another
form in MeSH. Seventy percent of the missing terms are either broader
terms than MeSH headings or synonyms of chart terms/concepts.
Approximately 19% of the dropped terms could not form a strong map to
MeSH. The study indicates that, since so many chart terms are found in
some form, a chart-generated search can link to many related concepts in
MeSH, but a significant number of chart concepts must be added to the UMLS
or cross referenced to MeSH. Provided by UMI. </P>
<P>Moving toward international standards in primary care informatics:
clinical vocabulary. Conference Summary Report. 1995 Nov 1-2; New Orleans.
Rockville (MD): Agency for Health Care Policy and Research; 1996 Oct. 35
p. (AHCPR pub. no. 96-0069) Available also from <A
"http://www.ahcpr.gov/research/pcinform/">http://www.ahcpr.gov/research/pcinform/</A>.</P>
<P>Mullins HC, Scanland PM, Collins D, Treece L, Petruzzi P Jr., Goodson
A, Dickinson M. The efficacy of SNOMED, Read codes, and UMLS in coding
ambulatory family practice clinical records. Proc AMIA Fall Symp
1996:135-9. This study was initially developed as a traditional
quantitative study to determine the level of match of identified clinical
terms in three (3) clinical vocabularies. To address concerns raised by a
review of the literature and our own experience, a supplemental study to
collect qualitative data was added. Dictated progress notes from a
stratified sample of patient visits over a period of four (4) years were
used to obtain a representative sample of terms. A total of 144 progress
notes were selected taking into consideration the usual demographics plus
additional variables. From the 144 clinical notes, 864 terms were
extracted and evaluated by level of match. The within-term effect was
highly significant (F=58.69, p&lt;-.001), indicating significant
differences in the mean level of match for the three coding systems.
Qualitative findings suggest that this and other published studies may not
answer questions about the "efficacy of available clinical vocabularies in
coding ambulatory family practice clinical records", and additional
studies are needed which must be carefully structured and utilize a
standardized procedure. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>O'Keefe KM, Sievert M, Mitchell JA. Mendelian inheritance in man:
diagnoses in the UMLS. Proc Annu Symp Comput Appl Med Care 1993:735-9.
Because they deal with many distinct but rare inheritance diseases,
geneticists have difficulty translating from their codes to other
biomedical coding schemes. The objective of this research was to
investigate the potential uses and difficulties of using the UMLS
Metathesaurus for genetic diagnoses and to make recommendations to UMLS
developers for improvements in UMLS for common genetic disorders. The 110
most common Mendelian Inheritance in Man disorders from the Missouri
Genetic Disease Program over the period of one year were translated into
MeSH, ICD and SNOMED. The more common diseases are more likely to be
mapped than the rarer ones. Diseases with a proven genetic inheritance
pattern are more likely to be mapped than those with speculated
inheritance patterns. Approximately one third of all diagnoses were not
mapped across all three coding schemes in Meta-1.2. The ICD coding scheme
was found to be too broad to be meaningful for genetic diagnosis or
epidemiological purposes. MeSH and SNOMED need to be made more specific
and complete, and all of the new version of SNOMED needs to be included in
the Metathesaurus. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Payne TH, Martin DR. How useful is the UMLS metathesaurus in developing
a controlled vocabulary for an automated problem list? Proc Annu Symp
Comput Appl Med Care 1993:705-9. We are developing a set of problem list
phrases to be used in the automated problem list of a prototype clinical
computing system. Because of the large number of terms in the Unified
Medical Language System (UMLS) and the links between them, we are
experimenting with the use of the UMLS as the foundation for our problem
list phrase set. We have found the UMLS to be very useful for this
project, but that it lacks many phrases clinicians wish to include in the
problem list. Internal linkages between phrases provided in the UMLS are
not well suited to our needs. We plan to continue our use of the UMLS but
to add problem list phrases and linkages between phrases to support
browsing and decision support applications. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Rosenberg KM, Coultas DB. Acceptability of Unified Medical Language
System terms as substitute for natural language general medicine clinic
diagnoses. Proc Annu Symp Comput Appl Med Care 1994:193-7. The
acceptability of using the Unified Medical Language System (UMLS) concept
phrases to substitute for physicians' diagnosis statements was
investigated. Physician diagnosis statements recorded in the University of
New Mexico's General Medicine Clinic were input into a computer program
that automatically finds the best matching UMLS concept phrases. The
computer program written in C++ integrates UMLS searching and browsing
with a graphical user interface. Five attending physicians in the
Department of Internal Medicine rated the acceptability of the UMLS
concept phrase as a substitute for the original physician statement. One
hundred and ninety-five patients' notes were examined with 447 diagnosis
statements recorded of which 271 statements were unique. Attending
physicians rated their satisfaction with the automated UMLS substitutes on
a scale of 1 (extremely dissatisfied) to 5 (extremely satisfied).
Intrarater (mean 0.94) and interrater correlations (mean 0.75) were high.
The mean rating was 4.0 (quite satisfied). Most (73%) of the substitution
were satisfactory (rating of 4 or 5), 16% were neutral (rating of 3), and
21% were unsatisfactory (rating of 1 or 2). A review of the substitutions
showed a frequent lack of clinical modifier terms in UMLS as has been
previously described. Comparison to a previous study shows the broader
term coverage of UMLS to be a more acceptable source of diagnosis codes
than using International Classification of Diseases revision 9 alone.
These results suggest that UMLS can be an effective tool for coding
unconstrained physician diagnoses. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Sato L, McClure RC, Rouse RL, Schatz CA, Greenes RA. Enhancing the
Metathesaurus with clinically relevant concepts: anatomic representations.
Proc Annu Symp Comput Appl Med Care 1992:388-91. To create a comprehensive
taxonomy for medical concepts it is necessary to identify gaps and
reconcile differences that exist between clinical, bibliographic, and
other source vocabularies. As part of the Unified Medical Language System
project, we have proposed enhancements to the Metathesaurus by the
inclusion of terms from two source vocabularies with different unique
perspectives or views. This process has disclosed a number of issues that
arise as complexity increases. These issues must be resolved if the
resultant Metathesaurus is to support the variety of uses for which it is
intended. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Warren JJ, Campbell JR, Palandri MK, Stoupa RA. Analysis of three
coding schemes: can they capture nursing care plan concepts? Proc Annu
Symp Comput Appl Med Care 1994:962.</P>
<P>Zielstorff RD, Cimino C, Barnett GO, Hassan L, Blewett DR.
Representation of nursing terminology in the UMLS Metathesaurus: a pilot
study. Proc Annu Symp Comput Appl Med Care 1992:392-6. To see whether the
National Library of Medicine's Metathesaurus (tm) includes terminology
relevant to clinical nursing practice, two widely used nursing
vocabularies were matched against the Meta. The two nursing vocabularies
are 1) the North American Nursing Diagnosis List of Approved Diagnoses;
and 2) the Omaha System, a vocabulary of problems and interventions
developed by the Omaha Visiting Nurses Association. First, the terms were
scanned against Meta in their native form, with phrases and combinations
intact. This produced a relatively low percentage of exact matches (12%).
Next, the terms were separated into core concepts and modifiers and the
analysis was repeated. The percentage of exact matches to terms in Meta
increased to 32%. However, the semantic types of the split terms often
were not equivalent to the semantic types of the phrases from which the
split terms were derived; also, in some cases, terms returned as exact
matches had different meanings in Meta. Automatic scanning for lexical
matches is a helpful first step in searching for vocabulary representation
in Meta, but term-by-term search for context, semantic type and definition
is essential. However, it seems clear that representation of nursing
terminology in the Metathesaurus needs to be expanded. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=2d>Information Sources Map</A></STRONG><BR></LI></UL>
<HR>
<P>Masys DR. An evaluation of the source selection elements of the
prototype UMLS Information Sources Map. Proc Annu Symp Comput Appl Med
Care 1992:295-8. The Information Sources Map (ISM) is a component of the
National Library of Medicine's Unified Medical Language System (UMLS)
project. The ISM is intended to provide both human-readable and
machine-interpretable information about the content, scope, and access
conditions for various information sources such as databases, expert
systems, and the organizations which make these information sources
available. Automated source selection is supported by three types of
indexing in the ISM: Medical Subject Heading (MeSH) terms and subheadings;
Semantic Types from the UMLS Semantic Network; and Semantic Type
Relations, which depict pairs of semantic types joined by a relationship
chosen from the Semantic Network. This paper reports a study of the recall
and precision of the source selection elements in the prototype version of
the ISM. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Masys DR, Humphreys BL. Structure and function of the UMLS information
sources map. Medinfo 1992;7(Pt 2):1518-21. A health professional seeking
information which is represented in computerized format faces formidable
difficulties in determining which information sources may be relevant to a
particular question, and in gaining access to that information. The first
version of a new UMLS data file called the Information sources map (ISM)
has been created to address this problem. The ISM is intended to provide
both human-readable and machine-interpretable information about the
content, scope, and access conditions for various information sources such
as databases, expert systems, and the organizations which make these
information sources available. The first prototype of the ISM features
indexing elements which support automated source selection; subsequent
versions will encode the logic necessary to connect to and retrieve
information from the sources represented in the ISM file.</P>
<P>Miller PL, Clyman JI, Frawley SJ, Paton JA, Powsner SM, Roderer N,
Shifman MA. NetMenu and a prototype UMLS information sources map. Proc
Annu Symp Comput Appl Med Care 1993:957. This paper describes NetMenu and
an Information Sources Map (ISM), two tools under development to help the
biomedical user find out about a range of network-based information
sources, and to connect automatically to a chosen source. The prototype
ISM is developed as part of the Unified Medical Language System (UMLS)
project of the National Library of Medicine. Both NetMenu and the ISM are
operational at Yale University School Medicine and are available for use
elsewhere. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Miller PL, Frawley SJ, Wright L, Roderer NK, Powsner SM. Lessons
learned from a pilot implementation of the UMLS information sources map. J
Am Med Inform Assoc 1995 Mar-Apr;2(2):102-15. OBJECTIVE: To explore the
software design issues involved in implementing an operational information
sources map (ISM) knowledge base (KB) and system of navigational tools
that can help medical users access network-based information sources
relevant to a biomedical question. DESIGN: A pilot biomedical ISM KB and
associated client-server software (ISM/Explorer) have been developed to
help students, clinicians, researchers, and staff access network-based
information sources, as part of the National Library of Medicine's (NLM)
multi-institutional Unified Medical Language System (UMLS) project. The
system allows the user to specify and constrain a search for a biomedical
question of interest. The system then returns a list of sources matching
the search. At this point the user may request 1) further information
about a source, 2) that the list of sources be regrouped by different
criteria to allow the user to get a better overall appreciation of the set
of retrieved sources as a whole, or 3) automatic connection to a source.
RESULTS: The pilot system operates in client-server mode and currently
contains coded information for 121 sources. It is in routine use from
approximately 40 workstations at the Yale School of Medicine. The lessons
that have been learned are that: 1) it is important to make access to
different versions of a source as seamless as possible, 2) achieving
seamless, cross-platform access to heterogeneous sources is difficult, 3)
significant differences exist between coding the subject content of an
electronic information resource versus that of an article or a book, 4)
customizing the ISM to multiple institutions entails significant
complexities, and 5) there are many design trade-offs between specifying
searches and viewing sets of retrieved sources that must be taken into
consideration. CONCLUSION: An ISMKB and navigational tools have been
constructed. In the process, much has been learned about the complexities
of development and evaluation in this new environment, which are different
from those for Gopher, wide area information servers (WAIS),
World-Wide-Web (WWW), and MOSAIC resources. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Miller PL, Paton JA, Clyman JI, Powsner SM. Prototyping an
institutional IAIMS/UMLS information environment for an academic medical
center. Bull Med Libr Assoc 1992 Jul;80(3):281-7. The paper describes a
prototype information environment designed to link network-based
information resources in an integrated fashion and thus enhance the
information capabilities of an academic medical center. The prototype was
implemented on a single Macintosh computer to permit exploration of the
overall information architecture and to demonstrate the various desired
capabilities prior to full-scale network-based implementation. At the
heart of the prototype are two components: a diverse set of information
resources available over an institutional computer network and an
information sources map designed to assist users in finding and accessing
information resources relevant to their needs. The paper describes these
and other components of the prototype and presents a scenario illustrating
its use. The prototype illustrates the link between the goals of two
National Library of Medicine initiatives, the Integrated Academic
Information Management System (IAIMS) and the Unified Medical Language
System (UMLS). Copyright by and reprinted with permission of the Medical
Library Association.</P>
<P>Miller PL, Wright LW, Frawley SJ, Clyman JI, Powsner SM. Selecting
relevant information resources in a network-based environment: the UMLS
information sources map. Medinfo 1992;7(Pt 2):1512-7. The paper describes
experience in building a prototype information sources map (ISM) as part
of the Unified Medical language System (UMLS) project of the National
Library of Medicine. A test set of 112 representative medically-related
information sources was compiled. The purpose was to explore what type of
coded information should be included in the ISM to help select sources
relevant to a user query. For each ISM entry (describing a particular
information source), two general types of coded information were included.
(1) Coding using MeSH terms and Meta-1 semantic types was used to
characterize the source's subject content. (2) Additional coded
information related to the source's use. The paper discusses experience in
coding the information sources to create the prototype ISM, and describes
a study to assess the utility of the different coded information in
selecting sources relevant to a user query.</P>
<P>Shifman MA, Clyman JI, Paton JA, Powsner SM, Roderer NK, Miller PL.
NetMenu. Experience in the implementation of an institutional menu of
information sources. Proc Annu Symp Comput Appl Med Care 1993:554-8.
NetMenu is a program developed at Yale University, which enables a
straightforward access to online information systems. NetMenu has been
deployed in several diverse settings within the medical center. In the
hospital, NetMenu functions as a front-end for the clinical workstation,
providing access to the hospital information system, the clinical
laboratory computer, a drug database and several bibliographic databases.
The medical libraries utilize NetMenu for both medical education
workstations and for scholarly information workstations. This paper
describes the initial experience in the implementation, support, and
maintenance of NetMenu as an institutional menu of information sources.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Silverstein SM, Miller PL, Cullen MR. An information sources map for
Occupational and Environmental Medicine: guidance to network-based
information through domain-specific indexing. Proc Annu Symp Comput Appl
Med Care 1993:616-20. This paper describes a prototype information sources
map (ISM), an on-line information source finder, for Occupational and
Environmental Medicine (OEM). The OEM ISM was built as part of the Unified
Medical Language System (UMLS) project of the National Library of
Medicine. It allows a user to identify sources of on-line information
appropriate to a specific OEM question, and connect to the sources. In the
OEM ISM we explore a domain-specific method of indexing information source
contents, and also a domain-specific user interface. The indexing
represents a domain expert's opinion of the specificity of an information
source in helping to answer specific types of domain questions. For each
information source, an index field represents whether a source might
provide useful information in an occupational, industrial, or
environmental category. Additional fields represent the degree of
specificity of a source in individual question types in each category. The
paper discusses the development, design, and implementation of the
prototype OEM ISM. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=2e>Distribution Formats and Associated
Tools</A></STRONG><BR></LI></UL>
<HR>
<P>McCray AT, Divita G. ASN.1: defining a grammar for the UMLS knowledge
sources. Proc Annu Symp Comput Appl Med Care 1995:868-72. The Unified
Medical Language System (UMLS) project provides resources on an
experimental basis to the research community. In 1995 the four UMLS
Knowledge Sources have been provided in an additional data format,
Abstract Syntax Notation One (ASN.1). The benefits of ASN.1 are that it
provides a standard, formal grammar for complex data and allows exchange
of that data in a way which is independent of the particular software and
hardware environment in which the data are created and stored. The paper
begins with an introduction to the ASN.1 standard itself. It continues
with a discussion of the ASN.1 implementation of the UMLS Knowledge
Sources and some of the consequences for the newly released UMLS Knowledge
Source Server. It concludes with a discussion of some of the benefits of
using ASN.1 encoded data. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>McCray AT, Razi A. The UMLS Knowledge Source server. Medinfo 1995;8(Pt
1):144-7. The UMLS Knowledge Source server is an evolving tool for
accessing information stored in the UMLS Knowledge Sources. The system
architecture is based on the client-server paradigm wherein remote site
users send their requests to a centrally managed server at the U.S.
National Library of Medicine. The client programs can run on platforms
supporting the TCP/IP communication protocol. Access to the system is
provided through a command-line interface and through an Application
Programming Interface.</P>
<P>McCray AT, Razi AM, Bangalore AK, Browne AC, Stavri PZ. The UMLS
knowledge source server: a versatile internet-based research tool. Proc
AMIA Fall Symp 1996:164-8. The National Library of Medicine's Unified
Medical Language System (UMLS) project regularly distributes a set of
Knowledge Sources to the research community. In 1995 the UMLS data were
made available for the first time through the Internet-based UMLS
Knowledge Source Server. The server can be accessed through three
different client interfaces. The World Wide Web interface allows users to
browse and explore the data and to see how those data are organized in the
UMLS. The command-line interface is best suited for batch processing, and
the application programming interface allows developers at remote sites to
embed calls in their application programs to the Knowledge Source Server.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>McCray AT, Srinivasan S, Browne AC. Lexical methods for managing
variation in biomedical terminologies. Proc Annu Symp Comput Appl Med Care
1994:235-9. Access to biomedical terminologies is hampered by the high
degree of variability inherent in natural language terms and in the
terminologies themselves. The lexicon, lexical programs, databases, and
indexes included with the 1994 release of the UMLS Knowledge Sources are
designed to help users manage this variability. We describe these
resources and illustrate their flexibility and usefulness in providing
enhanced access to data in the UMLS Metathesaurus. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Nelson SJ, Sherertz DD, Tuttle MS, Erlbaum MS. Using MetaCard: a
Hypercard browser for biomedical knowledge sources. Proc Annu Symp Comput
Appl Med Care 1990:151-4. As part of the Unified Medical Language System
(UMLS) project a large metathesaurus (Meta-1) was built. We have adapted a
Hypercard browser of Meta-1 (MetaCard) to enable a user to continue the
browsing process, extending from the Metathesaurus to a variety of
different knowledge sources. These knowledge sources include Current
Disease Description (CDD), Physicians Data Query (PDQ), and Mendelian
Inheritance in Man (MIM). Metacard can also be linked to Grateful Med, the
NLM program which is used to search MEDLINE. A user can, with minimal
training, use MetaCard to access these four different knowledge sources.
The links (how one goes from one knowledge source to another) have been
built on the basis of disease names. In organizing these links, it was
helpful to use CDD as an additional source of knowledge about how diseases
are named in various sources. Further plans are to expand the use of the
Metathesaurus in building links to knowledge sources. The question with
each method of linking used will be to what extent the method provides a
robust linkage whose utility can be anticipated. While future refinements
or developments of links may give additional functionality, the current
linkages are sufficient to provide a useful browsing tool. We believe that
this is so because much of the knowledge in each of these sources is
organized around diseases. Navigation is easy because of the similarities
of the Hypercard interfaces to each of the knowledge sources: a common set
of conventions (e.g. point and click) helps make it work. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Sherertz D, Tuttle M, Cole W, Erlbaum M, Olson N, Nelson S. A HyperCard
implementation of Meta-1.: The first version of the UMLS Metathesaurus.
Proc Annu Symp Comput Appl Med Care 1989:1017-8. The Unified Medical
Language System (UMLS) is being designed to provide uniform access to
computer-based resources in biomedicine. For the foreseeable future, the
foundation of the UMLS will be a "metathesaurus of concepts," synthesized
from existing biomedical nomenclatures. Meta-1, the first version of the
Metathesaurus, will contain all of MeSH, a selection of terms from primary
care, clinical medicine, and other domains, and all terms from SNOMED,
ICD-9-CM, and CPT-4 which "match" them--about 30,000 terms. In addition,
Meta-1 contains information about the occurrence and co-occurrence of its
terms in selected resources, such as MEDLINE. As Meta-1 will contain about
100MB of terms and relationships, it is unlikely that it will be
"printed." Instead, some UMLS applications will support Metathesaurus
"browsing." One way of browsing Meta-1 will be via the Apple Macintosh
application called HyperCard. A demonstration of a HyperCard interface,
called "Meta-Card" will first acquaint viewers with the contents of the
pre-human-review version of Meta-1, and second, illustrate how an
object-oriented interface can be programmed to support various visual
metaphors, e.g. "click-to-get-more-information," and
"click-to-follow-a-semantic-link," and the notion of a Metathesaurus
esthetic. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Tuttle MS, Sperzel WD, Olson NE, Erlbaum MS, Suarez-Munist O, Sherertz
DD, Nelson SJ, Fuller LF. The homogenization of the Metathesaurus schema
and distribution format. Proc Annu Symp Comput Appl Med Care 1992:299-303.
The third version of the UMLS Metathesaurus, Meta-1.2, to be released in
October 1992, will have a simpler schema and simpler distribution formats
than the first two versions, Meta-1.0 and Meta-1.1 released in October
1990 and 1991, respectively. For one thing, it will have only a single
kind of entry (Concept), rather than three (Concept, Related, and
Synonym). Further, the Relational Format, will consist of four logical
relations, or tables, instead of the nearly three score different tables
used to represent the same kind of information in Meta-1.1. These four
tables will contain, respectively, (1) the names of each concept, (2) the
relationships between concepts, (3) attributes of the concepts, and (4) a
word-based index into the concept names. We argue that the new schema and
formats provide a better conceptual model of the Metathesaurus, and
represent the information contained there more uniformly. Even though
these changes are incremental and evolutionary, both users and software
developers should find the Meta-1.2 significantly easier to understand,
and the information contained in it significantly easier to use. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H3>UMLS Applications</H3>
<UL>
<LI><STRONG>Vocabulary Construction and Concept Discovery</STRONG><BR>
<UL>
<LI><STRONG><A name=3a>Vocabulary Design, Construction and
Maintenance</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Campbell KE, Musen MA. Representation of clinical data using SNOMED III
and conceptual graphs. Proc Annu Symp Comput Appl Med Care 1992:354-8.
None of the coding schemes currently contained within the Unified Medical
Language System (UMLS) is sufficiently expressive to represent medical
progress notes adequately. Some coding schemes suffer from domain
incompleteness, others suffer from the inability to represent modifiers
and time references, and some suffer from both problems. The recently
released version of the Systematized Nomenclature of Medicine (SNOMED III)
is a potential solution to the data-representation problem because it is
relatively domain complete, and because it uses a generative coding scheme
that will allow the construction of codes that contain modifiers and time
references. SNOMED III does have an important weakness, however. SNOMED
III lacks a formalized system for using its codes; thus, it fails to
ensure consistency in its use across different institutions. Application
of conceptual-graph formalisms to SNOMED III can ensure such consistency
of use. Conceptual-graph formalisms will also allow mapping of the
resulting SNOMED III codes onto relational data models and onto other
formal systems, such as first-order predicate calculus. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Carenini G, Moore JD. Using the UMLS Semantic Network as a basis for
constructing a terminological knowledge base: a preliminary report. Proc
Annu Symp Comput Appl Med Care 1993:725-9. Sharing and reuse of knowledge
bases is recognized in Artificial Intelligence and Medical Informatics as
beneficial, but difficult. Reusing an existing knowledge base can save
considerable time and effort during the knowledge engineering phase, and
facilitates integration of systems. However, the degree to which knowledge
can be shared among different applications is still mainly an empirical
question. In this paper, we describe the preliminary results of our
attempt to reuse the UMLS Semantic Network as an ontology for the
knowledge base of a patient education system. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Cimino JJ. Controlled medical vocabulary construction: methods from the
Canon Group [editorial]. J Am Med Inform Assoc 1994
May-Jun;1(3):296-7.</P>
<P>Cimino JJ. Formal descriptions and adaptive mechanisms for changes in
controlled medical vocabularies. Methods Inf Med 1996 Sep;35(3):202-10.
Comment in: Methods Inf Med 1996 Sep;35(3):211-7; Methods Inf Med 1996
Sep;35(3):218-9. (Eng). Standard controlled medical vocabularies are
typically based on a coding scheme, while medical informatics applications
tend to have a more formal conceptual foundation. When such applications
attempt to use data coded with standard vocabularies, problems can arise
when the standard vocabulary changes over time. A formal taxonomy is
presented for describing the semantic changes which can occur in a
vocabulary, such as simple addition, refinement, precoordination,
disambiguation, redundancy, obsolescence, discovered redundancy, major
name changes, minor name changes, code reuse, and changed codes. The
taxonomy is described that used to effect change in one concept-based
vocabulary (the Medical Entities Dictionary), and the utility of the
approach is demonstrated by applying it to the changes appearing in the
1994 release of the International Classification of Diseases, Ninth
Edition, with Clinical Modifications (ICD-9-CM). </P>
<P>Cimino JJ, Clayton PD. Coping with changing controlled vocabularies.
Proc Annu Symp Comput Appl Med Care 1994:135-9. For the foreseeable
future, controlled medical vocabularies will be in a constant state of
development, expansion and refinement. Changes in controlled vocabularies
must be reconciled with historical patient information which is coded
using those vocabularies and stored in clinical databases. This paper
explores the kinds of changes that can occur in controlled vocabularies,
including adding terms (simple additions, refinements, redundancy and
disambiguation), deleting terms, changing terms (major and minor name
changes), and other special situations (obsolescence, discovering
redundancy, and precoordination). Examples are drawn from actual changes
appearing in the 1993 update to the International Classification of
Diseases (ICD9-CM). The methods being used at Columbia-Presbyterian
Medical Center to reconcile its Medical Entities Dictionary and its
clinical database are discussed. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Cimino JJ, Clayton PD, Hripcsak G, Johnson SB. Knowledge-based
approaches to the maintenance of a large controlled medical terminology. J
Am Med Inform Assoc 1994 Jan-Feb;1(1):35-50. OBJECTIVE: Develop a
knowledge-based representation for a controlled terminology of clinical
information to facilitate creation, maintenance, and use of the
terminology. DESIGN: The Medical Entities Dictionary (MED) is a semantic
network, based on the Unified Medical Language System (UMLS), with a
directed acyclic graph to represent multiple hierarchies. Terms from four
hospital systems (laboratory, electrocardiography, medical records coding,
and pharmacy) were added as nodes in the network. Additional knowledge
about terms, added as semantic links, was used to assist in integration,
harmonization, and automated classification of disparate terminologies.
RESULTS: The MED contains 32,767 terms and is in active clinical use.
Automated classification was successfully applied to terms for laboratory
specimens, laboratory tests, and medications. One benefit of the approach
has been the automated inclusion of medications into multiple
pharmacologic and allergenic classes that were not present in the pharmacy
system. Another benefit has been the reduction of maintenance efforts by
90%. CONCLUSION: The MED is a hybrid of terminology and knowledge. It
provides domain coverage, synonymy, consistency of views, explicit
relationships, and multiple classification while preventing redundancy,
ambiguity (homonymy) and misclassification. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Cimino JJ, Hripcsak G, Johnson SB, Clayton PD. Designing an
introspective, multipurpose, controlled medical vocabulary. Proc Annu Symp
Comput Appl Med Care 1989:513-8. The medical vocabulary used in clinical
information systems must be more than a simple list of terms. We agree
that such a vocabulary must have synonymy, domain completeness, and
multiple classifications providing consistent views and explicit
relationships, while remaining unambiguous and non-redundant. We examine
the abilities of existing controlled vocabularies (ICD9-CM, SNOMED, MeSH,
CMIT, CPT4, COSTAR, HELP, DXPLAIN, and UMLS) to meet these goals and
propose an enhanced vocabulary structure based on a directed, acyclic
semantic net. This structure provides a representation which permits
introspection by the vocabulary maintenance system responsible for
providing a terminology which meets the seven requirements. The
vocabulary, called the Medical Entities Dictionary (MED), will serve a
variety of applications. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Cimino JJ, Hripcsak G, Johnson SB, Friedman C, Fink DJ, Clayton PD.
UMLS as knowledge base- a rule-based expert system approach to controlled
medical vocabulary management. Proc Annu Symp Comput Appl Med Care
1990:175-9. The National Library of Medicine is developing a Unified
Medical Language System (UMLS) which addresses the need for integration of
several large, nationally accepted vocabularies. This is important to the
clinical information system under development at the Columbia-Presbyterian
Medical Center (CPMC). The authors are using UMLS components as the core
of their effort to integrate existing local CPMC vocabularies which are
not among the source vocabularies of the UMLS. They are also using the
UMLS to build a knowledge base of vocabulary structure and content such
that logical rules can be developed to assist in the management of the
integrated vocabularies. At present, the UMLS Semantic Network is used to
organize terms which describe laboratory procedures. The authors have
developed a set of rules for identifying undesirable conditions in the
vocabulary. They have applied these rules to 526 laboratory test terms and
have found ten cases (2%) of definite redundancy and sixty-eight cases
(13%) of potential redundancy. The rules have also been used to organize
the terminology in new ways that facilitate its management. Using the UMLS
model as a vocabulary knowledge base allows the authors to apply an expert
system approach to vocabulary integration and management. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Evans DA, Cimino JJ, Hersh WR, Huff SM, Bell DS. Toward a
medical-concept representation language. The Canon Group. J Am Med Inform
Assoc 1994 May-Jun;1(3):207-17. The Canon Group is an informal
organization of medical informatics researchers who are working on the
problem of developing a deeper representation formalism for use in
exchanging data and developing applications. Individuals in the group
represent experts in such areas as knowledge representation and
computational linguistics, as well as in a variety of medical
subdisciplines. All share the view that current mechanisms for the
characterization of medical phenomena are either inadequate (limited or
rigid) or idiosyncratic (useful for a specific application but incapable
of being generalized or extended). The Group proposes to focus on the
design of a general schema for medical-language representation including
the specification of the resources and associated procedures required to
map language (including standard terminologies) into representations that
make all implicit relations visible, reveal hidden attributes, and
generally resolve ambiguous or vague references. The Group is proceeding
by examining large numbers of texts (records) in medical sub-domains to
identify candidate concepts and by attempting to develop general rules and
representations for elements such as attributes and values so that all
concepts may be expressed uniformly. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Fowler J, Buffone G, Moreau D. The architecture of a distributed
medical dictionary. Medinfo 1995;8(Pt 1):126-30. Exploiting high-speed
computer networks to provide a national medical information infrastructure
is a goal for medical informatics. The Distributed Medical Dictionary
under development at Baylor College of Medicine is a model for an
architecture that supports collaborative development of a distributed
online medical terminology knowledge-base. A prototype is described that
illustrates the concept. Issues that must be addressed by such a system
include high availability, acceptable response time, support for local
idiom, and control of vocabulary.</P>
<P>Humphreys BL. Comment on "Toward data standards for clinical nursing
information". J Am Med Inform Assoc 1994 Nov-Dec;1(6):472-4.</P>
<P>Levesque Y, LeBlanc AR, Maksud M. MD Concept: a model for integrating
medical knowledge. Proc Annu Symp Comput Appl Med Care 1994:252-6. Many
integrated clinical information systems depend on large knowledge bases
containing a dictionary of terms as well as specific information about
each term and the relationships between terms. We propose a knowledge base
model called MD Concept which is based on a semantic network and uses an
object-oriented paradigm and relational tables. A prototype has been
developed which integrates the Unified Medical Language System (UMLS) with
other databases including the Systematized Nomenclature of Medicine
(SNOMED II), the Diagnostic and Statistical Manual of Mental Disorders
(DSM-IIIR) and a pharmaceutical database. We demonstrate how a user can
easily navigate in this knowledge world using a browser. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Rada R. Maintaining thesauri and metathesauri. Int Classif 1990
;17(3-4):158-164. Maintaining a thesuarus is a time-consuming task which
should go hand-in-hand with the indexing of information and should be
supported by software. To connect different docuement databases their
respective thesauri should be related. The most straightforward way to
support this by computer is to map the terms of one thesaurus to those of
another. Such a mapping creates one kind of metathesaurus. As citation
systems are extended to include full-text on-line , a new thesaurus may be
used to index individual paragraphs of a document, and a metathesaurus may
apply to a universe of paragraphs. To illustrate these principles several
computer systems are described which help people maintain thesauri and
metathesauri. Particular success has been had by the National Library of
Medicine with its Medical Subject Headings and its Unified Medical
Language System. Copyright International Society for Knowledge
Organization.</P>
<P>Rosse C, Ben Said M, Eno KR, Brinkley JF. Enhancements of anatomical
information in UMLS knowledge sources. Proc Annu Symp Comput Appl Med Care
1995:873-7. Although anatomical terminology forms a part of biomedical
structured vocabularies, available sources lack the requisite granularity,
semantic types and relationships for comprehensively and consistently
representing anatomical concepts in machine readable form. Thoracic
angiology was selected as a proof of concept experiment for in depth
representation of symbolic information in gross anatomy through the
enhancement of semantic types, concepts and relationships in UMLS.
Provided the representation of concepts is comprehensive, hierarchies
generated with four types of simple relationships are capable of
displaying anatomical information from the systemic view point with
sufficient detail to meet the needs of applications in basic science
education and in the practice of surgical subspecialties. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Wigertz OB, Clayton PD, Hripcsak G, Linnarsson R. Knowledge
representation and data model to support medical knowledge base
transportability. In: Talmon JL, Fox J, editors. Knowledge based systems
in medicine: methods, applications and evaluation. Proceedings of the
Workshop System Engineering in Medicine; 1989 Mar 16-18; Maastricht,
Netherlands. Berlin: Springer-Verlag; 1991. p. 80-90. The authors discuss
the thesis that it is possible to design a data model and a representation
of the medical decision-making knowledge in a sufficiently high level and
modular format to ease transportability between institutions and systems.
They discuss some of the prerequisites of this uniform representation of
medical terms, medical data and medical logic. They discuss UMLS (unified
medical language system) and its metathesaurus. The possible impact of the
sharing of knowledge bases on the development and use of medical decision
support systems is also considered.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=3b>Vocabulary Standards, Servers, and Mapping
Methods</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Anderson CL, Hukill M, Wang W, Bangerter B, Kattelman M, Hartmann-Voss
K. A practical approach to structuring data in an integrated expert
system. Proc Annu Symp Comput Appl Med Care 1990:599-603. At the onset of
creating an expert system integrated into existing clinical information
systems, the need for a special data dictionary which could map to diverse
terminology in a variety of domains at a variety of health care delivery
sites was identified. Based upon research conducted on existing medical
nomenclatures, a methodology for structuring the expert system data
dictionary was produced. The dictionary is segmented into specific domains
(e.g. pharmacy, laboratory, etc.) as determined by traditional health care
specialties. Terms within each domain are categorized further with
guidance from working conventions commonly found within that specialty
(e.g. ICD-9-CM, CPT-4, etc.). Emphasis was placed on selecting protocols
consistent with those used in the Unified Medical Language System to
accommodate future translatability. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Chute CG, Cesnik B, van Bemmel JH. Medical data and knowledge
management by integrated medical workstations: summary and
recommendations. Int J Biomed Comput 1994 Jan;34(1-4):175-83. The health
care professional workstation will function as an interface between the
user and the patient data as well as an interface pertinent medical
knowledge. Appropriate knowledge focus will require the workstation to
recognize the concepts and structure of patient data, and understand the
scope and access methods of knowledge sources. Issues are organized around
five major themes: (i) structure, (ii) reliability and validation, (iii)
views, (iv) location, and (v) ethical and legal. Conventional database
representations can effectively address data structure and format
variations that will inevitably persist in local data stores. The
reliability of data and the validation of knowledge are critical issues
that may determine the ultimate utility of clinical workstations.
Alternative views of patient information and knowledge sources represent
the true power of an intelligent data portal, represented by a
well-designed clinical workstation. Both data and knowledge are optimally
represented in decentralized information networks, although the
confidentiality and ownership of this information must be respected.
Evolutionary progress toward consistent representations of knowledge and
patient data will be facilitated by the establishment of
self-documentation standards for the developers of data encoding systems
and knowledge sources, perhaps extended from the preliminary model
afforded by the Unified Medical Language System (UMLS).</P>
<P>Cimino JJ. Data storage and knowledge representation for clinical
workstations. Int J Biomed Comput 1994 Jan;34(1-4):185-94. The
representation of patient information for use in clinical workstations is
a complex problem. Ideally, it should be addressed in a way that allows
multiple uses of the data, including simple manual review, sharing and
pooling across institutions, and as input to knowledge-based decision
support systems. To a great extent, this means coding information with
controlled medical vocabularies, but it does not mean that all information
must be codable before workstations are feasible. This paper defines some
of the choices, both current and future, that are available to address the
needs of controlled medical vocabularies for representing data and
knowledge in clinical workstations and explores some of the implications
of those choices.</P>
<P>Cimino JJ, Barnett GO. Automated translation between medical
terminologies using semantic definitions. MD Comput 1990
Mar-Apr;7(2):104-9. Published erratum appears in MD Comput 1990
Jul-Aug;7(4):268. Automatic translation of medical terms from one
controlled vocabulary into another is essential to the integration of
diverse medical informatics systems. We have developed a strategy in which
medical terms are represented in a standard format that provides semantic
description of the terms. We demonstrate the representational power of our
method by showing that a subset of medical terms (procedures) from diverse
vocabularies can be described in this manner. We assess the potential
usefulness of our approach for facilitating automatic translation by
finding the closest match for MeSH cardiovascular procedures with ICD-9
procedures. Copyright 1990 Springer-Verlag.</P>
<P>Cimino JJ, Johnson SB, Hripcsak G, Sideli RV, Fink DJ, Friedman C,
Clayton PD. One year's experience with the Unified Medical Language System
(UMLS) in academia and patient care. Medinfo 1992;7(Pt 2):1501-5. The
first edition of the Unified Medical Language System (UMLS), released in
September 1990 by the National Library of Medicine consists of a
metathesaurus of 78862 interrelated terms and a semantic network for
categorizing these terms and representing additional relationships between
them. The integration of information systems at the Columbia-Presbyterian
Medical Center requires attention to the problem of reconciling the
diverse controlled vocabularies used by each system. One of the purposes
of the UMLS is to facilitate automatic methods for such reconciliation.
The authors have been exploring the suitability of the UMLS for various
aspects of the vocabulary management tasks, including vocabulary
organization, vocabulary representation and automated vocabulary
translation. The UMLS is demonstrated to have specific value for
vocabulary representation and translation; however, many areas are
identified where further development of its knowledge sources would be
useful.</P>
<P>France FH. Standards for nomenclature (HIS). In: Bakker AR, Ehlers CTh,
Bryant JR, Hammond WE, editors. Hospital information systems:
scope-design-architecture. Proceedings of the IMIA Working Conference;
1991 Sep 7-11; Gottingen, Germany. Amsterdam: North-Holland; 1992. p.
167-74. Uniform HISs which allow one to retrieve medical terms with the
same meaning are discussed. The ICD-10 (International Classification of
Diseases, 10th Revision) is expected to be published in 1993 by the World
Health Organisation (WHO), with an alphabetic index containing former
ICD-9 codes (conversion table). Each country has to decide when ICD-10
will be in use for hospitalized patients. Mapping extensions of ICD-9 to
ICD-10 will take some more time, as well as conversion tables to DSM III,
SNOMED, or MeSH, as performed by UMLS (Unified Medical Language System of
the National Library of Medicine-USA). ICD-9-CM is updated regularly in
the USA, but insufficient to describe laboratory tests, X-Rays procedures,
drugs; ICCS (International Classification of Clinical Services) contains
such information, complementary to ICD-9-CM. ICCS might be tested for
mapping other codes, as a kind of metacode, in order to detect differences
between national nomenclatures, when they exist. Up to now it remains
'Canadian-American' rather than 'international'. Standards for
nomenclature should also include rules for coding, as well as elements of
semantics in order to enable similar interpretation.</P>
<P>Houtchens BA, Allen A, Clemmer TP, Lindberg DA, Pedersen S.
Telemedicine protocols and standards: development and implementation. J
Med Syst 1995 Apr;19(2):93-119.</P>
<P>Humphreys BL, Hole WT, McCray AT, Fitzmaurice JM. Planned NLM/AHCPR
large-scale vocabulary test: using UMLS technology to determine the extent
to which controlled vocabularies cover terminology needed for health care
and public health. J Am Med Inform Assoc 1996 Jul-Aug;3(4):281-7. The
National Library of Medicine (NLM) and the Agency for Health Care Policy
and Research (AHCPR) are sponsoring a test to determine the extent to
which a combination of existing health-related terminologies covers
vocabulary needed in health information systems. The test vocabularies are
the 30 that are fully or partially represented in the 1996 edition of the
Unified Medical Language System (UMLS) Metathesaurus, plus three planned
additions: the portions of SNOMED International not in the 1996
Metathesaurus, the Read Clinical Classification, and the Logical
Observations Identifiers, Names, and Codes (LOINC) system. These
vocabularies are available to testers through a special interface to the
Internet-based UMLS Knowledge Source Server. The test will determine the
ability of the test vocabularies to serve as a source of controlled
vocabulary for health data systems and applications. It should provide the
basis for realistic resource estimates for developing and maintaining a
comprehensive "standard" health vocabulary that is based on existing
terminologies. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Masys DR. Of codes and keywords: standards for biomedical nomenclature.
Acad Med 1990 Oct;65(10):627-9.</P>
<P>McCormick KA, Lang N, Zielstorff R, Milholland DK, Saba V, Jacox A.
Toward standard classification schemes for nursing language:
recommendations of the American Nurses Association Steering Committee on
Databases to Support Clinical Nursing Practice. J Am Med Inform Assoc 1994
Nov-Dec;1(6):421-7. The American Nurses Association (ANA) Cabinet on
Nursing Practice mandated the formation of the Steering Committee on
Databases to Support Clinical Nursing Practice. The Committee has
established the process and the criteria by which to review and recommend
nursing classification schemes based on the ANA Nursing Process Standards
and elements contained in the Nursing Minimum Data Set (NMDS) for
inclusion of nursing data elements in national databases. Four
classification schemes have been recognized by the Committee for use in
national databases. These classification schemes have been forwarded to
the National Library of Medicine (NLM) for inclusion in the Unified
Medical Language System (UMLS) and to the International Council of Nurses
for the development of a proposed International Classification of Nursing
Practice. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Pretschner DP. Data analysis and information modelling: objects codes,
concepts. Radiat Prot Dosim 1995;57 (1-4):175-84. </P>
<P>Prokosch HU, Dudeck J, Michel A. Standards for data dictionaries (HIS).
In: Bakker AR, Ehlers CTh, Bryant JR, Hammond WE, editors. Hospital
information systems: scope-design-architecture. Proceedings of the IMIA
Working Conference; 1991 Sep 7-11; Gottingen, Germany. Netherlands:
North-Holland; 1992. p. 189-95. A controlled vocabulary is a basic
requirement in the development and implementation of HIS. A medical data
dictionary (MDD) has to provide a framework for such a controlled
vocabulary and additionally the possibility to define semantic
relationships and mappings to other MDDs. Several useful models for MDDs
have been developed in the last years. Among these the UMLS seems to be
the most comprehensive one. Unfortunately this project is still limited to
the US. In order to achieve one standard framework for MDD development,
researchers from Europe and all over the world will have to carefully
analyze the work which has already been done within UMLS and try to
finally agree to one common approach.</P>
<P>Prokosch HU, Kamm S, Wieczorek D, Dudeck J. Knowledge representation in
pharmacology. A possible application area for the Arden Syntax? Proc Annu
Symp Comput Appl Med Care 1991:243-7. In 1990 the Arden Syntax was
proposed as a first version of a standardized syntax for the
representation of medical knowledge. For the evaluation of the
practicability of this first release we have analyzed the medical and
pharmacological knowledge applied in the process of drug prescription. The
separation of declarative (e.g. in a semantic network) and procedural
knowledge is a basic issue of our research. We therefore propose to
further extend the Arden syntax with declarative knowledge representation
facilities. One way to do this may be the incorporation of a standardized
medical data dictionary (e.g. the UMLS Metathesaurus) which promotes the
representation of medical terms in a semantic network. Furthermore the
problem of 'institution-specific knowledge', which is especially important
for the issue of knowledge sharing between different institutions, is
analyzed based on examples of knowledge modules for monitoring drug
allergies and drug-drug-interactions. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Rocha RA, Beatriz MD, Huff SM. Automated translation between medical
vocabularies using a frame-based interlingua. Proc Annu Symp Comput Appl
Med Care 1993:690-4. The integration of clinical systems almost always
requires a translation phase, where vocabularies are compared and the
similar concepts are matched. The lack of standards in the area of medical
concept representation makes this task very difficult. The authors
describe the development of a frame-based application that automatically
translates terms found in one vocabulary to another. The application
implements an innovative scoring algorithm that ranks the best matches
using an exponential scale. Preliminary results and the comparison against
a manual process in the same domain are also discussed. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Rocha RA, Huff SM. Using digrams to map controlled medical
vocabularies. Proc Annu Symp Comput Appl Med Care 1994:172-6. A program
for matching between controlled medical vocabularies has been developed
which adopts methods used in the domain of Information Retrieval. This
program combines a stemmer based on fragments of words (digrams) with a
similarity function. The proposed stemmer did not require any knowledge
about word-formation rules and helped the identification of several kinds
of word variants. The adopted similarity function assigned the highest
score to the best candidate match in 99.0% of the cases. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Rocha RA, Huff SM, Haug PJ, Warner HR. Designing a controlled medical
vocabulary server: the VOSER project. Comput Biomed Res 1994
Dec;27(6):472-507. The authors describe their experience designing a
controlled medical vocabulary server created to support the exchange of
patient data and medical decision logic. The first section introduces
practical and theoretical premises that guided the design of the
vocabulary server. The second section describes a series of structures
needed to implement the proposed server, emphasizing their conformance to
the design premises. The third section introduces potential applications
that provide services to end users and also a group of tools necessary for
maintaining the server corpus. In the fourth section, the authors propose
an implementation strategy based on a common framework and on the
participation of groups from different health-related domains. Copyright
1994 Academic Press.</P>
<P>Walker DC, Walters RF. Developing a multilingual index to access
health-care terminologies. M Comput 1993 Sep;1(4):32-3, 36-42.</P>
<P>Walker DC, Walters RF, Cimino JJ, Dujols P, Li Ensheng, Giere W, Kiuchi
T, Lamberts H, Moore WG, Roger FH, Satomura Y, Stitt FW.
Internationalization of health care terminology. Medinfo 1992;7(Pt
2):1444-51. The Unified Medical Language System (UMLS) of the National
Library of Medicine (NLM) provides a terminology interface for biomedical
resources in the USA. A project to develop a multinational terminology
resource could effectively extend the existing thesaurus of the UMLS, and
help the internationalization of medical information. What the UMLS is at
this moment, is summarized in this paper. Some terminologies with
'terminology browsers' are briefly described. The formation of a more
encompassing multilingual master index to access various terminologies and
their 'browsers' is advocated. An international body to initiate and
coordinate any such project would be needed.</P>
<P>Zeng Q, Cimino JJ. Mapping medical vocabularies to the Unified Medical
Language System. Proc AMIA Fall Symp 1996:105-9. This paper presents our
work in automated mapping of medical vocabularies to the National Library
of Medicine's Unified Medical Language System (UMLS). We used the UMLS
Knowledge Source (KS) tool to map terms from several sources to UMLS
Metathesaurus concepts. We compared performance of the KS tools with our
own Minimal Representable Units Method (MRUM). The KS tools were able to
map terms from 13% to 54% of the time, depending on the term set and the
KS options used. Our MRUM method mapped between 96% and 99% of the terms.
Based on our experience, we believe that questions remain about the best
method by which the UMLS can be used to achieve automated term
translation. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Zielstorff RD, Lang NM, Saba VK, McCormick KA, Milholland DK. Toward a
uniform language for nursing in the US: work of the American Nurses
Association Steering Committee on databases to support clinical practice.
Medinfo 1995;8(Pt 2):1362-6. This paper reports on the work of the
American Nurses Association Steering Committee on Databases to Support
Clinical Practice, in existence since 1989. Responding to its broad
charges, the Steering Committee has laid down the foundations for its work
in declaring the nursing process as the framework for nursing data in
database systems, and in endorsing the Nursing Minimum Data Set as the set
of minimum elements for any system designed to carry health-related data
that reflects nursing care. In addition, the Steering Committee has begun
initiatives to: 1) promote the inclusion of nursing-related data in large
health-related databases, and 2) develop a Uniform Language for nursing
through a phased approach. The Steering Committee also works directly with
the International Council of Nurses to promote the inclusion of nursing
data in internationally used classification systems and to develop an
international language that describes nursing care.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=3c>Knowledge Acquisition and Concept
Discovery</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Burgun A, Bodenreider O, Denier P, Delamarre D, Botti G, Lukacs B,
Mayeux D, Bremond M, Kohler F, Fieschi M, et al. Knowledge acquisition
from the UMLS sources: application to the description of surgical
procedures. Medinfo 1995;8(1):75-9. The re-usability of lexicons and
knowledge in medicine is a crucial challenge. The Unified Medical Language
System (UMLS) project has attempted to provide a repository of concepts,
semantically categorized for biomedical domain. This paper describes some
results about the relevance of UMLS structures for specific purposes. We
have focused on the description of surgical procedures. Discussion
concerns synonymy of terms, granularity of concepts, and ontology. A
preliminary work on the exploitation of interconcept links by a
computerized application reveals a heterogeneous implementation of those
relationships. However, the UMLS provides a powerful knowledge base for
developers.</P>
<P>Burgun A, Botti G, Lukacs B, Mayeux D, Seka LP, Delamarre D, Bremond M,
Kohler F, Fieschi M, Le Beux P. A system that facilitates the orientation
within procedure nomenclatures through a semantic approach. Med Inf (Lond)
1994 Oct-Dec;19(4):297-310.</P>
<P>Burgun A, Delamarre D, Botti G, Lukacs B, Mayeux D, Bremond M, Kohler
F, Fieschi M, Le Beux P. Designing a sub-set of the UMLS knowledge base
applied to a clinical domain: methods and evaluation. Proc Annu Symp
Comput Appl Med Care 1994:968. The UMLS is a complex collection of
interconnected biomedical concepts derived from standard nomenclatures.
Designing a specific subset of the UMLS knowledge base relevant to a
medical domain is a prerequisite for the development of specialized
applications based on UMLS. We have developed a method based on the
selection of the appropriate terms in original nomenclatures and the
capture of a set of UMLS terms that are linked to them in the network to a
certain degree. We have experimented it as the foundation for a concept
base applied to urology. Results depend on the exhaustiveness of the
relationships between the Meta-1 concepts. A preliminary analysis of the
sub-base reveals that some adaptations of vocabulary and ontology are
required for clinical applications. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Gangemi A, Galanti M, Galeazzi E, Rossi Mori A. Beyond UMLS:
computational semantics for medical records. Medinfo 1992;7(Pt 1):703-8.
Computational semantics is a promising approach for effective processing
of clinical data, integrating medical record, information retrieval
applications, statistical databases and knowledge based systems. The
authors introduce 'semiotic codes', a generalization of medical language
and artificial coding systems, and describe their power by a scale: (C1)
non-combinatorial Codes (icons); (C2) combinatorial Codes, with finite set
of signs (conventional coding systems); (C3) combinatorial Codes, with
potentially infinite set of signs (combinatorial expressions); (C4)
combinatorial Codes, with calculable synonymy (formal languages); (C5)
creative Codes with unpredictable synonymy and homonymy (natural
languages). In order to convert each potential Semiotic Code to another,
one needs a system of class C4, that is computationally 'more powerful'
than any other. It is based on formal expressions, allowing to compare
definitions of concepts to decide their equivalence. It acts as an
interlingua to represent medical concepts in the computer, in a neutral
way with respect to other semiotic codes and applications.</P>
<P>Hardy B, Burgun A, Le Beux P. Accessing to knowledge base terms using
UMLS concepts. In: Brender J, Christensen JP, Scherrer JR, McNair P,
editors. Medical Informatics Europe '96: Human facets in information
technologies. Washington: IOS Press; 1996. p. 164-8. (Studies in health
technology and informatics; 34). This paper presents the first phase of a
project of a terminology server based on the UMLS project and using both
lexical mapping and conceptual relations. The choice of tools has been to
build a user to data knowledge base using the PERL language associated the
World Wide Web technology and relational data base (ORACLE <SUP><FONT
size=1>tm</FONT></SUP>).</P>
<P>Hersh WR, Campbell EH, Evans DA, Brownlow ND. Empirical, automated
vocabulary discovery using large text corpora and advanced natural
language processing tools. Proc AMIA Fall Symp 1996:159-63. A major
impediment to the full benefit of electronic medical records is the lack
of a comprehensive clinical vocabulary. Most existing vocabularies do not
allow the full expressiveness of clinical diagnoses and findings that are
often qualified by modifiers relating to severity, acuity, and temporal
factors. One reason for the lack of expressivity is the inability of
traditional manual construction techniques to identify the diversity of
language used by clinicians. This study used advanced natural language
processing tools to identify terminology in a clinical findings domain,
compare its coverage with the UMLS Metathesaurus, and quantify the effort
required to discover the additional terminology. It was found that
substantial amounts of phrases and individual modifiers were not present
in the UMLS Metathesaurus and that modest effort in human time and
computer processing were needed to obtain the larger quantity of terms.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Nelson SA, Olson NE, Fuller L, Tuttle MS, Cole WG, Sherertz DD.
Identifying concepts in medical knowledge. Medinfo 1995;8(Pt 1):33-6. The
barrier word method of identifying nominal phrases in text, using a very
long barrier word list, was evaluated in two different sets of text. In a
sample of 10 paragraphs from the Medical Knowledge Self-Assessment Program
of the American College of Physicians, the yield of nominal phrases as a
percent of total chunks isolated was 66%. Some 500,000 chunks were
isolated from Principles and Practice of Oncology (PPO). 38% of these
chunk-occurrences were of chunks which matched to 10,000 concept names in
Meta-1.4, the most recent version of the UMLS Metathesaurus. 50 paragraphs
from PPO were chosen at random. Co-occurrences of concepts in those
paragraphs were reviewed. 42 of the paragraphs had unique or infrequently
occurring co-occurrences which described closely the major thrust of the
paragraph.</P>
<P>Nelson SJ, Cole WG, Tuttle MS, Olson NE, Sherertz DD. Recognizing new
medical knowledge computationally. Proc Annu Symp Comput Appl Med Care
1993:409-13. Can new medical knowledge be recognized computationally? We
know knowledge is changing, and our knowledge-based systems will need to
accommodate that change in knowledge on a regular basis if they are to
stay successful. Computational recognition of these changes seems
desirable. It is unlikely that low level objects in the computational
universe, bits and characters, will change much over time, higher level
objects of language, where meaning begins to emerge, may show change. An
analysis of ten arbitrarily selected paragraphs from the Medical Knowledge
Self-Assessment Program of the American College of Physicians was used as
a test bed for nominal phrase recognition. While there were words not
known to Meta-1.2, only 8 of the 32 concepts new to the primary author
were pointed to by new words. Use of a barrier word method was successful
in identifying 23 of the 32 new concepts. Use of co-occurrence (in
sentences) of putative nominal phrases may reduce the amount of human
effort involved in recognizing the emergence of new relationships.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Rindflesch TC, Aronson AR. Ambiguity resolution while mapping free text
to the UMLS Metathesaurus. Proc Annu Symp Comput Appl Med Care 1994:240-4.
We propose a method for resolving ambiguities encountered when mapping
free text to the UMLS Metathesaurus. Much of the research in medical
informatics involves the manipulation of free text. The Metathesaurus
contains extensive information which supports solutions to problems
encountered while processing such text. After discussing the process of
mapping free text to the Metathesaurus and describing the ambiguities
which are often the result of such mapping, we provide examples of rules
designed to eliminate mapping ambiguities. These rules refer to the
context in which the ambiguity occurs and crucially depend on semantic
types obtained from the Metathesaurus. We have conducted a preliminary
test of the methodology and the results obtained indicate that the rules
successfully resolve ambiguity around 80% of the time. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Sneiderman CA, Rindflesch TC, Aronson AR. Finding the findings:
identification of findings in medical literature using restricted natural
language processing. Proc AMIA Fall Symp 1996:239-43. The ability to
search the biomedical literature based on findings would provide enhanced
access to information. We describe a computer program called FINDX which
relies on the UMLS Metathesaurus and restricted natural language
processing to identify findings in free text. Such identification can
serve as a filtering mechanism while selecting relevant papers. After
discussing the salient characteristics of findings on which FINDX depends,
we report on the results of an experiment in which we tested the program
on a set of MEDLINE abstracts pertaining to the diagnosis of Parkinson
Disease. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG>Data Creation</STRONG><BR>
<UL>
<LI><STRONG><A name=3d>Clinical Data</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Cimino JJ. Use of the Unified Medical Language System in patient care
at the Columbia-Presbyterian Medical Center. Methods Inf Med 1995
Mar;34(1-2):158-64. The Unified Medical Language System (UMLS) project at
the United States National Library of Medicine contains and organizes a
large number of terms from controlled medical vocabularies. This study
examines the suitability of the UMLS for representing patient care
information as it exists in the Columbia-Presbyterian Medical Center
(CPMC) clinical in formation system. Comparisons were made between the
semantic types, semantic relations and medical concepts of the UMLS and
the data model entities, semantic classes, semantic relations and concepts
in the CPMC system. Results of the comparison demonstrate that the UMLS
structural model is appropriate for representing CPMC vocabularies and
patient data and that the UMLS concepts provide excellent coverage of CPMC
concepts in many areas. Recommendations are made for enhancing UMLS
structure to provide additional coverage of the CPMC model. It is
concluded that content expansion to provide better coverage of clinical
terminology is possible within the current UMLS model.</P>
<P>Cimino JJ, Barnett GO. The physician's workstation: recording a
physical examination using a controlled vocabulary. Proc Annu Symp Comput
Appl Med Care 1987:287-91. A system has been developed which runs on
MS-DOS personal computers and serves as an experimental model of a
physician's workstation. The program provides an interface to a controlled
vocabulary which allows rapid selection of appropriate terms and modifiers
for entry of clinical information. Because it captures patient
descriptions, it has the ability to serve as an intermediary between the
physician and computer-based medical knowledge resources. At present, the
vocabulary permits rapid, reliable representation of cardiac physical
examination findings. Copyright 1987 IEEE. Reprinted, with permission.</P>
<P>Lindberg DA, Humphreys BL. The Unified Medical Language System (UMLS)
and computer-based patient records. In: Ball MJ, Collen MF, editors.
Aspects of the computer-based patient record. New York: Springer-Verlag;
1992. p. 165-75.</P>
<P>Lowe HJ. Image Engine: an object-oriented multimedia database for
storing, retrieving and sharing medical images and text. Proc Annu Symp
Comput Appl Med Care 1993:839-43. This paper describes Image Engine, an
object-oriented, microcomputer-based, multimedia database designed to
facilitate the storage and retrieval of digitized biomedical still images,
video, and text using inexpensive desktop computers. The current prototype
runs on Apple Macintosh computers and allows network database access via
peer to peer file sharing protocols. Image Engine supports both free text
and controlled vocabulary indexing of multimedia objects. The latter is
implemented using the TView thesaurus model developed by the author. The
current prototype of Image Engine uses the National Library of Medicine's
Medical Subject Headings (MeSH) vocabulary (with UMLS Meta-1 extensions)
as its indexing thesaurus. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Lowe HJ, Buchanan BG, Cooper GF, Vries JK. Building a medical
multimedia database system to integrate clinical information: an
application of high-performance computing and communications technology.
Bull Med Libr Assoc 1995 Jan;83(1):57-64. The rapid growth of
diagnostic-imaging technologies over the past two decades has dramatically
increased the amount of nontextual data generated in clinical medicine.
The architecture of traditional, text-oriented, clinical information
systems has made the integration of digitized clinical images with the
patient record problematic. Systems for the classification, retrieval, and
integration of clinical images are in their infancy. Recent advances in
high-performance computing, imaging, and networking technology now make it
technologically and economically feasible to develop an integrated,
multimedia, electronic patient record. As part of The National Library of
Medicine's Biomedical Applications of High-Performance Computing and
Communications program, we plan to develop Image Engine, a prototype
microcomputer-based system for the storage, retrieval, integration, and
sharing of a wide range of clinically important digital images. Images
stored in the Image Engine database will be indexed and organized using
the Unified Medical Language System Metathesaurus and will be dynamically
linked to data in a text-based, clinical information system. We will
evaluate Image Engine by initially implementing it in three clinical
domains (oncology, gastroenterology, and clinical pathology) at the
University of Pittsburgh Medical Center. Copyright by and reprinted with
permission of the Medical Library Association.</P>
<P>Stitt FW. The problem-oriented medical synopsis: coding, indexing, and
classification sub-model. Proc Annu Symp Comput Appl Med Care 1994:964. A
clinical information system consists of four major components: the
clinical database, decision support, data analysis (including outcomes),
and the development system. We have created such a system using generally
available database methodology. The system is documented using a
conceptual model, a physical model, and sub-models for individual
components. A key sub-model of the clinical database, for record-keeping,
has been defined for coding, indexing, and classification of the medical
narrative typically encountered in medical records. We describe an
approach to the development of the coding component that results in a
hybrid system for recording information, locating indexed information, and
summarizing it for analysis of outcomes. These are based on a primary term
list--the problem glossary; SNOMed--the Systematized Nomenclature of
Medicine (3rd. edition); and ICD-9-CM. The relationship with the UMLS is
also discussed. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Stitt FW. A standards-based clinical information system for HIV/AIDS.
Medinfo 1995;8(Pt 1):402. Objective: To create a clinical data repository
to interface the Veteran's Administration (VA) Decentralized Hospital
Computer Program (DHCP) and a departmental clinical information system for
the management of HIV patients. This system supports record-keeping,
decision-making, reporting, and analysis. The database development was
designed to overcome two impediments to successful implementations of
clinical databases: (i) lack of a standard reference data model, and; (ii)
lack of a universal standard for medical concept representation.
Background: Health Level Seven (HL7) is a standard protocol that specifies
the implementation of interfaces between two computer applications (sender
and receiver) from different vendors or sources of electronic data
exchange in the health care environment. This eliminates or substantially
reduces the custom interface programming and program maintenance that
would otherwise be required. HL7 defines the data to be exchanged, the
timing of the interchange, and the communication of errors to the
application. The formats are generic in nature and must be configured to
meet the needs of the two applications involved. The standard conceptually
operates at the seventh level of the ISO model for Open Systems
Interconnection (OSI). The OSI simply defines the data elements that are
exchanged as abstract messages, and does not prescribe the exact bit
stream of the messages that flow over the network. Lower level network
software developed according to the OSI model may be used to encode and
decode the actual bit stream. The OSI protocols are not universally
implemented and, therefore, a set of encoding rules for defining the exact
representation of a message must be specified. The VA has created an HL7
module to assist DHCP applications in exchanging health care information
with other applications using the HL7 protocol. The DHCP HL7 module
consists of a set of utility routines and files that provide a generic
interface to the HL7 protocol for all DHCP applications. Setting: The VA's
DHCP core modules are in standard use at 169 hospitals, and the role of
the VA system in health care delivery has been discussed elsewhere. This
development was performed at the Miami VA Medical Center Special
Immunology Unit, where a database was created for an HIV patient registry
in 1987. Over 2,300 patients have been entered into a database that
supports a problem-oriented summary of the patient's clinical record. The
interface to the VA DHCP was designed and implemented to capture
information from the patient treatment file, pharmacy, laboratory,
radiology, and other modules. Results: We obtained a suite of programs for
implementing the HL7 encoding rules from Columbia-Presbyterian Medical
Center in New York, written in ANSI C. This toolkit isolates our
application programs from the details of the HL7 encoding rules, and
allows them to deal with abstract messages and the programming level.
While HL7 has become a standard for healthcare message exchange, SQL
(Structured Query Language) is the standard for database definition, data
manipulation, and query. The target database provides clinical workstation
functionality. Medical concepts are encoded using a preferred terminology
derived from over 15 sources that include the Unified Medical Language
System and SNOMed International.</P>
<P>Trace D, Naeymi-Rad F, Almeida FD, Moidu K, Haines D. A longitudinal
medical record (IMR). Proc Annu Symp Comput Appl Med Care 1993:911. The
Intelligent Medical Record (IMR) is currently being used in patient care
activities at Norwalk Hospital in Norw alk, CT, and at Cook County
Hospital in Chicago, IL. IMR has evolved into a multi-encounter patient
record, stored in a multi-user database management system. The graphical
user interface is designed to support physician efforts to capture patient
data, c reate progress notes, and produce a longitudinal medical record.
The authors describe the program's major components, including its
multi-encounter knowledge management system, problem list, progress notes,
point-of-entry query, and interface to UMLS. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Wagner MM. An automatic indexing method for medical documents. Proc
Annu Symp Comput Appl Med Care 1991:1011-7. This paper describes
MetaIndex, an automatic indexing program that creates symbolic
representations of documents for the purpose of document retrieval.
MetaIndex uses a simple transition network parser to recognize a language
that is derived from the set of main concepts in the Unified Medical
Language System Metathesaurus (Meta-1). MetaIndex uses a hierarchy of
medical concepts, also derived from Meta-1, to represent the content of
documents. The goal of this approach is to improve document retrieval
performance by better representation of documents. An evaluation method is
described, and the performance of MetaIndex on the task of indexing the
Slice of Life medical image collection is reported. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Wagner MM, Cooper GF. Evaluation of a Meta-1-based automatic indexing
method for medical documents. Comput Biomed Res 1992 Aug;25(4):336-50.
This paper describes MetaIndex, an automatic indexing program that creates
symbolic representations of documents for the purpose of document
retrieval. MetaIndex uses a simple transition network parser to recognize
a language that is derived from the set of main concepts in the Unified
Medical Language System Metathesaurus (Meta-1). MetaIndex uses a hierarchy
of medical concepts, also derived from Meta-1, to represent the content of
documents. The goal of this approach is to improve document retrieval
performance by better representation of documents. An evaluation method is
described, and the performance of MetaIndex on the task of indexing the
Slice of Life medical image collection is reported. Copyright 1992
Academic Press.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=3e>Curricula and Faculty
Interests</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Breene M, Jasmin R, Eisner J. Computer-based curriculum analysis. A
customized approach using external standards and the UMLS. Proc Annu Symp
Comput Appl Med Care 1993:919. This article describes the beta test stage
of the first software product developed by The American Association of
Dental Schools (AADS) Curriculum Database Consortium, which is known as
CATs (Curriculum Analysis Tools). The consortium wanted to develop a
software tool that could adapt to the special circumstances of each of the
fifty Dental Schools and Allied Dental Programs, while accurately and
comprehensively representing their curricula. The product has satisfied
the principle requirements for user customization, cross-referencing to
external standards, and content searching by keyword using the UMLS. The
product provides an intuitive method of curriculum analysis with powerful
tools for viewing and interpreting the results. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Clyman SG. UMLS linked to a system for authoring simulations used in
evaluation of physicians. Proc Annu Symp Comput Appl Med Care 1993:921.
The National Board of Medical Examiners (NBME) develops examinations used
in licensing physicians in the United States. To complement existing
multiple-choice examinations, NBME has developed and is studying uncued,
dynamic, computer-based simulations (CBX) of the patient care environment.
In CBX, physicians type free-text orders for diagnostic studies,
procedures , consultants, medications, and other therapies. As simulated
time passes, patient conditions evolve in response to physician management
decisions; multiple outcomes are possible. One impediment to widespread
use of CBX is the technical expertise, time, a nd cost associated with it.
A new case authoring system called SEEDS (Simulation Environment
Engineering and Development System) will increase the efficiency of this
process. The National Library of Medicine's Unified Medical Language
System (UMLS) is use d in the development of SEEDS to link UMLS and CBX
terms and concepts. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Eisner J. Curriculum Analysis Tools (CATs). A cooperative approach to
the design of curriculum databases. Proc Annu Symp Comput Appl Med Care
1993:766-70. In 1990, a small group of dental schools agreed to pool their
resources and cooperate in the design and programming of curriculum
analysis software. After two and one-half years, the consortium had grown
to include more than 50 institutions. Its efforts have been endorsed by
the American Association of Dental Schools, and it is now beta testing its
first software product, known as Curriculum Analysis Tools (CATs). The
process by which the software has been developed, as well as its current
design, offers a unique blend of flexibility and creativity, which could
perhaps be adopted by other health professionals. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Eisner J. Multi-national, multi-lingual, multi-professional CATs:
(Curriculum Analysis Tools). Medinfo 1995;8(Pt 2):1706. A consortium of
dental schools and allied dental programs was established in 1991 with the
expressed purpose of creating a curriculum database program that was
end-user modifiable. In April of 1994, a beta version (Beta 2.5 written in
FoxPro(TM) 2.5) of the software CATs, an acronym for Curriculum Analysis
Tools, was released for use by over 30 of the consortium's 60 member
institutions, while the remainder either waited for the Macintosh (TM) or
Windows (TM) versions of the program or were simply not ready to begin an
institutional curriculum analysis project. Shortly after this release, the
design specifications were rewritten based on a thorough critique of the
Beta 2.5 design and coding structures and user feedback. The result was
Beta 3.0 which has been designed to accommodate any health professions
curriculum, in any country that uses English or French as one of its
languages. Given the program's extensive use of screen generation tools,
it was quite easy to offer screen displays in a second language. As more
languages become available as part of the Unified Medical Language System,
used to document curriculum content, the program's design will allow their
incorporation. When the software arrives at a new institution, the choice
of language and health profession will have been preselected, leaving the
Curriculum Database Manager to identify the country where the member
institution is located. With these 'macro' end-user decisions completed,
the database manager can turn to a more specific set of end-user questions
including: 1) will the curriculum view selected for analysis be created by
the course directors (provider entry of structured course outlines) or by
the students (consumer entry of class session summaries)?; 2) which
elements within the provided course outline or class session modules will
be used?; 3) which, if any, internal curriculum validation measures will
be in cluded?; and 4) which, if any, external validation measures will be
included. External measures can include accreditation standards,
entry-level practitioner competencies, an index of learning behaviors, an
index of discipline integration, or others defined by the institution.
When data entry, which is secure to the course level, is complete users
may choose to browse a variety of graphic representations of their
curriculum, or either preview or print a variety of reports that offer
more detail about the content and adequacy of their curriculum. The
progress of all data entry can be monitored by the database manager over
the course of an academic year, and all reports contain extensive missing
data reports to ensure that the user knows whether they are studying
complete or partial data. Institutions using the beta version of the
program have reported considerable satisfaction with its functionality and
have also offered a variety of design and interface enhancements. The
anticipated release date for Curriculum Analysis Tools (CATs) is the first
quarter of 1995.</P>
<P>Fowler J, Wheeler DA, Camerino PW, Bat O, Burch PE. Development of a
faculty research interest resource. Proc AMIA Fall Symp 1996:363-72. We
have developed a faculty research interests resource by "mining" MEDLINE
for relationships that are no t directly queryable through the normal
MEDLINE schema. Faculty citations are retrieved and World-Wide Web pages
built to interconnect authors, their citations, and the MeSH terms that
have been assigned to these citations. The design and development of t he
resource are discussed and examples of the results illustrated. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Kanter SL. Using the UMLS to represent medical curriculum content. Proc
Annu Symp Comput Appl Med Care 1993:762-5. Recent innovations in medical
education have highlighted the need for faculty involved with the
curriculum to carefully examine curricular content with goals of detecting
omissions and unwanted redundancies of subject matter, adding and
integrating new content, and deleting old content. A number of medical
schools have attempted to deal with these issues by developing a database
of curricular content information, most often using faculty- or
student-selected keywords to represent each unit of instruction. However,
several problems have been identified with this method, and achieving the
goals mentioned above remains a formidable task. This paper outlines an
alternative method that uses the resources of the UMLS to characterize a
medical concept by the semantic types of its co-occurring terms. This
approach can facilitate achievement of the aforementioned goals. Copyright
by and reprinted with permission of the American Medical Informatics
Association. </P>
<P>Kanter SL, Miller RA, Tan M, Schwartz J. Using POSTDOC to recognize
biomedical concepts in medical school curricular documents. Bull Med Libr
Assoc 1994 Jul;82(3):283-7. Recognition of the biomedical concepts in a
document is prerequisite to further processing of the document: medical
educators examine curricular documents to discover the coverage of certain
topics, detect unwanted redundancies, integrate new content, and delete
old content; and clinicians are concerned with terms in patient medical
records for purposes ranging from creation of an electronic medical record
to identification of medical literature relevant to a particular case.
POSTDOC (POSTprocessor of DOCuments) is a computer application that (1)
accepts as input a free-text, ASCII-formatted document and uses the
Unified Medical Language System (UMLS) Metathesaurus to recognize relevant
main concept terms; (2) provides term co-occurrence data and thus is able
to identify potentially increasing correlations among concepts within the
document; and (3) retrieves references from MEDLINE files based on user
identification of relevant subjects. This paper describes a formative
evaluation of POSTDOC's ability to recognize UMLS Metathesaurus biomedical
concepts in medical school lecture outlines. The precision and recall
varied over a wide range and were deemed not yet acceptable for automated
creation of a database of concepts from curricular documents. However,
results were good enough to warrant further study and continued system
development. Copyright by and reprinted with permission of the Medical
Library Association.</P>
<P>Zucker J, Chase H, Molholt P, Bean C, Kahn RM. A comprehensive strategy
for designing a web-based medical curriculum. Proc AMIA Fall Symp
1996:41-5. In preparing for a full featured online curriculum, it is
necessary to develop scaleable strategies for software design that will
support the pedagogical goals of the curriculum and which will address the
issues of acquisition and updating of materials, of robust content-based
linking, and of integration of the online materials into other methods of
learning. A complete online curriculum, as distinct from an individual
computerized module, must provide dynamic updating of both content and
structure and an easy pathway from the professor's notes to the finished
online product. At the College of Physicians and Surgeons, we are
developing such strategies including a scripted text conversion process
that uses the Hypertext Markup Language (HTML) as structural markup rather
than as display markup, automated linking by the use of relational
databases and the Unified Medical Language System (UMLS), integration of
text, images, and multimedia along with interface designs which promote
multiple contexts and collaborative study. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG>Natural Language Processing, Indexing and
Retrieval</STRONG><BR>
<UL>
<LI><STRONG><A name=3f>NLP Methods and
Algorithms</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Baud RH, Rassinoux A-M, Lovis C, Wagner J, Griesser V, Michel P-A,
Scherrer J-R. Knowledge sources for natural language processing. Proc AMIA
Fall Symp 1996:70-4. This paper aims at reviewing the problem of feeding
Natural Language Processing (NLP) too ls with convenient linguistic
knowledge in the medical domain. A syntactic approach lacks the potential
to solve a number of typical situations with ambiguities and is clearly
insufficient for quality treatment of natural language. On the other hand,
a co nceptual approach relies on some modelling of the domain, of which
the elaboration is a long-term process and where the ultimate solutions
are far from being recognised and universally accepted. In-between is the
beauty of the compromise. How can we signi ficantly improve the coverage
of linguistic knowledge in the years to come? Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Evans DA, Brownlow ND, Hersh WR, Campbell EM. Automating concept
identification in the eletronic medical record: an experiment in
extracting dosage information. Proc AMIA Fall Symp 1996:388-92. We discuss
the development and evaluation of an automated procedure for extracting
drug-dosage information from clinical narratives. The process was
developed rapidly using existing technology and resources, including
categories of terms from UMLS96. Evaluations over a large training and
smaller test set of medical records demonstrate an approximately 80% rate
of exact and partial matches on target phrases, with few false positives
and a modest rate of false negatives. The results suggest a strategy for
automating general concept identification in electronic medical records.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Evans DA, Chute CG, Handerson SK, Yang Y, Monarch IA, Hersh WR. 'Latent
semantics' as a basis for managing variation in medical terminologies.
Medinfo 1992;7(Pt 2):1462-8. The authors are exploiting a version of
latent semantic indexing as a general solution to the problem of managing
language variation. They treat medical terms as the 'documents' to be
retrieved by natural-language expressions of concepts, taken as 'queries'.
In experiments, they have focused on (1) establishing a basis for the
decomposition of concepts (terms) by lexical items and (2) exploiting
existing medical thesauri to create Lexical-Item x Term spaces. They have
demonstrated the ability to interpret natural-language statements of
medical findings in multiple medical terminologies simultaneously (e.g.
INTERNIST-I/QMR, PTXT, and NLM/UMLS META-1 vocabularies) and also to
derive concept-relation spaces from collections of terms in the NLM/UMLS
Metathesaurus (META-1). The power of this approach is that it does not
depend on detailed semantic representations or on word-for-word
correspondences among terms and that multiple vocabularies can be
represented side-by-side.</P>
<P>Johnson SB, Aguirre A, Peng P, Cimino J. Interpreting natural language
queries using the UMLS. Proc Annu Symp Comput Appl Med Care 1993:294-8.
This paper describes AQUA (A QUery Analyzer), the natural language front
end of a prototype information retrieval system. AQUA translates a user's
natural language query into a representation in the Conceptual Graph
formalism. The graph is then used by subsequent components to search
various resources such as databases of the medical literature. The focus
of the parsing method is on semantics rather than syntax, with semantic
restrictions being provided by the UMLS Semantic Net. The intent of the
approach is to provide a method that can be emulated easily in
applications that require simple natural language interfaces. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Joubert M, Fieschi M, Robert JJ. A conceptual model for information
retrieval with UMLS. Proc Annu Symp Comput Appl Med Care 1993:715-9.
Information retrieval in large information databases is a
non-deterministic process which needs a sequence of search steps
generally. One of the main problems to which the end-users are faced is to
parse efficiently their questions into the query language that the
computer systems allow. Conceptual graphs were initially designed for
natural language analysis and understanding. Due to their closeness to
semantic networks, their expressiveness is powerful enough to be applied
to knowledge representation and use by computer systems. This work
demonstrates that conceptual graphs are a suitable means to model the
end-users queries on the basis of the thesaurus and the semantic network
of the UMLS project. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Joubert M, Fieschi M, Robert JJ, Tafazzoli A. Users conceptual views on
medical information databases. Int J Biomed Comput 1994 Oct;37(2):93-104.
As information databases we consider all the kinds of information
repositories that are handled by computer systems. When querying very
large information databases, the end-users are often faced with the
problem to parse their questions efficiently into the query languages of
the computer systems. Conceptual graphs were initially designed for
natural language analysis and understanding. Due to their closeness to
semantic networks, their expressiveness is powerful enough to be applied
to knowledge representation and use by computer systems. This work
demonstrates that conceptual graphs are a suitable means to model both the
information in patient databases and the queries to these databases, and
that operations on graphs can compute the pattern matching process needed
to provide the answers. A prototype that exploits this model is presented.
Experiments have been made with the material furnished by the Unified
Medical Language System project (version 2, 1992) of the National Library
of Medicine, USA.</P>
<P>Joubert M, Robert J-J, Miton F, Fieschi M. The project ARIANE:
conceptual queries to information databases. Proc AMIA Fall Symp
1996:378-82. As information databases we consider all the collections of
data records indexed by key-words, stored and delivered by computer
systems. In previous research works we demonstrated the interest to design
a conceptual model, in the conceptual graphs formalism, and to implement a
computational model for information retrieval in large information
databases. These models are based on the UMLS knowledge sources. This
paper reminds briefly these models and describes tests done in querying a
patients database and a bibliographical database. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Lamiell JM, Wojcik ZM, Isaacks J. Computer auditing of surgical
operative reports written in English. Proc Annu Symp Comput Appl Med Care
1993:269-73. We developed a script-based scheme for automated auditing of
natural language surgical operative reports. Suitable operations
(appendectomy and breast biopsy) were selected, then audit criteria and
operation scripts conforming with our audit criteria were developed. Our
LISP parser was context and expectation sensitive. Parsed sentences were
represented by semigraph structures and placed in a textual database to
improve efficiency. Sentence ambiguities were resolved by matching the
narrative textual database to the script textual database and employing
the Uniform Medical Language System (UMLS) Knowledge Sources. All audit
criteria questions were successfully answered for typical operative
reports by matching parsed audit questions to the textual database.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>McCray AT. Extending a natural language parser with UMLS knowledge.
Proc Annu Symp Comput Appl Med Care 1991:194-8. Over the past several
years our research efforts have been directed toward the identification of
natural language processing methods and techniques for improving access to
biomedical information stored in computerized form. To provide a testing
ground for some of these ideas we have undertaken the development of
SPECIALIST, a prototype system for parsing and accessing biomedical text.
The system includes linguistic and biomedical knowledge. Linguistic
knowledge involves rules and facts about the grammar of the language.
Biomedical knowledge involves rules and facts about the domain of
biomedicine. The UMLS knowledge sources, Meta-1 and the Semantic Network,
as well as the UMLS test collection, have recently contributed to the
development of the SPECIALIST system. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>McCray AT, Aronson AR, Browne AC, Rindflesch TC, Razi A, Srinivasan S.
UMLS knowledge for biomedical language processing. Bull Med Libr Assoc
1993 Apr;81(2):184-94. This paper describes efforts to provide access to
the free text in biomedical databases. The focus of the effort is the
development of SPECIALIST, an experimental natural language processing
system for the biomedical domain. The system includes a broad coverage
parser supported by a large lexicon, modules that provide access to the
extensive Unified Medical Language System (UMLS) Knowledge Sources, and a
retrieval module that permits experiments in information retrieval. The
UMLS Metathesaurus and Semantic Network provide a rich source of
biomedical concepts and their interrelationships. Investigations have been
conducted to determine the type of information required to effect a map
between the language of queries and the language of relevant documents.
Mappings are never straightforward and often involve multiple inferences.
Copyright by and reprinted with permission of the Medical Library
Association.</P>
<P>Murphy SN, Barnett GO. Achieving automated narrative text
interpretation using phrases in the electronic medical record. Proc AMIA
Fall Symp 1996:532-6. Stereotypic phrases are used by clinicians
throughout the medical record, as seen in an analysis of our COSTAR
medical record database. These phrases are often associated with an
underlying semantic concept; for example the phrase CLEAR LUNGS may be
linked with the concept "normal lung exam" for a particular physician.
Formalizing these associations with concepts from the UMLS using the
MEDPhrase application allowed us to automate interpretation of narrative
text within our electronic medical record. Copyright by and reprinted with
permission of the American Medical Informatics Association. </P>
<P>Peng P, Aguirre A, Johnson SB, Cimino JJ. Generating MEDLINE search
strategies using a librarian knowledge-based system. Proc Annu Symp Comput
Appl Med Care 1993:596-600. We describe a librarian knowledge-based system
that generates a search strategy from a query representation based on a
user's information need. Together with the natural language parser AQUA,
the system functions as a human/computer interface, which translates a
user query from free text into a BRS Onsite search formulation, for
searching the MEDLINE bibliographic database. In the system, conceptual
graphs are used to represent the user's information need. The UMLS
Metathesaurus and Semantic Net are used as the key knowledge sources in
building the knowledge base. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Pietrzyk PM. Free text analysis. Int J Biomed Comput 1995
Apr;39(1):139-44. In the context of hospital information systems (HIS)
medical free text analysis is reviewed with respect to current automated
approaches to literature retrieval, case retrieval and fact retrieval from
textual data in the patient record. The Unified Medical Language System
(UMLS) project has enormously stimulated current research. It is expected
that UMLS knowledge sources and SNOMED III (which need a translation into
other languages as soon as possible) as well as the conceptual graphs
formalism, could become standards to utilize free text information
contained in HIS databases.</P>
<P>Sager N, Lyman M, Bucknall C, Nhan N, Tick LJ. Natural language
processing and the representation of clinical data. J Am Med Inform Assoc
1994 Mar-Apr;1(2):142-60. OBJECTIVE: Develop a representation of clinical
observations and actions and a method of processing free-text patient
documents to facilitate applications such as quality assurance. DESIGN:
The Linguistic String Project (LSP) system of New York University utilizes
syntactic analysis, augmented by a sublanguage grammar and an information
structure that are specific to the clinical narrative, to map free-text
documents into a database for querying. MEASUREMENTS: Information
precision (I-P) and information recall (I-R) were measured for queries for
the presence of 13 asthma-health-care quality assurance criteria in a
database generated from 59 discharge letters. RESULTS: I-P, using counts
of major errors only, was 95.7% for the 28-letter training set and 98.6%
for the 31-letter test set. I-R, using counts of major omissions only, was
93.9% for the training set and 92.5% for the test set. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Satomura Y, do Amaral MB. Automated diagnostic indexing by natural
language processing. Med Inf (Lond) 1992 Jul-Sep;17(3):149-63.</P>
<P>Volot F, Zweigenbaum P, Bachimont B, Ben Said M, Bouaud J, Fieschi M,
Boisvieux JF. Structuration and acquisition of medical knowledge. Using
UMLS in the conceptual graph formalism. Proc Annu Symp Comput Appl Med
Care 1993:710-4. The use of a taxonomy, such as the concept type lattice
(CTL) of Conceptual Graphs, is a central structuring piece in a
knowledge-based system. The knowledge it contains is constantly used by
the system, and its structure provides a guide for the acquisition of
other pieces of knowledge. We show how UMLS can be used as a knowledge
resource to build a CTL and how the CTL can help the process of
acquisition for other kinds of knowledge. We illustrate this method in the
context of the MENELAS natural language understanding project. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=3g>Indexing and Retrieval Methods and
Algorithms</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Aronson AR. The effect of textual variation on concept based
information retrieval. Proc AMIA Fall Symp 1996:373-7. Accounting for
textual variation in the documents and queries processed by information
retrieval systems is considered essential for achieving good retrieval.
Recent research has called into question several of the techniques used to
support this endeavor. This paper reports on experiments with a concept
based information retrieval system which relies on a program called
MetaMap to account for textual variation in the process of mapping
biomedical text such as MEDLINE bibliographic citations to the UMLS
Metathesaurus. The experiments confirm that the effort expended in
handling textual variation is well-spent for at least one type of concept
based information retrieval. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P>
<P>Chute CG, Yang Y. An evaluation of concept based latent semantic
indexing for clinical information retrieval. Proc Annu Symp Comput Appl
Med Care 1992:639-43. Latent Semantic Indexing (LSI) of surgical case
report text using ICD-9-CM procedure codes and index terms was evaluated.
The precision-recall performance of this two-step matrix retrieval process
was compared with the SMART Document retrieval system, surface word
matching, and humanly assigned procedure codes. Human coding performed
best, two-step LSI did less well than surface matching or SMART. This
evaluation suggests that concept-based LSI may be compromised by its
two-stage nature and its dependence upon a robust term database linked to
main concepts. However, the potential elegance of partial- credit concept
matching merits the continued evaluation of LSI for clinical case
retrieval. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Chute CG, Yang Y, Evans DA. Latent Semantic Indexing of medical
diagnoses using UMLS semantic structures. Proc Annu Symp Comput Appl Med
Care 1991:185-9. The relational files within the UMLS Metathesaurus
contain rich semantic associations to main concepts. We invoked the
technique of Latent Semantic Indexing to generate information matrices
based on these relationships and created semantic vectors using singular
value decomposition. Evaluations were made on the complete set and subsets
of Metathesaurus main concepts with the semantic type Disease or Syndrome.
Real number matrices were created with main concepts, lexical variants,
synonyms, and associated expressions. Ancestors, children, siblings, and
related terms were added to alternative matrices, preserving the
hierarchical direction of the relation as the imaginary component of a
complex number. Preliminary evaluation suggests that this technique is
robust. A major advantage is the exploitation of semantic features which
derive from a statistical decomposition of UMLS structures, possibly
reducing dependence on the tedious construction of semantic frames by
humans. Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Doszkocs TE, Sass RK. An associative semantic network for machine-aided
indexing, classification and searching. In: Fidel R, Kwasnik BH, Smith PJ,
editors., Proceedings of 3rd ASIS SIG/CR Classification Research Workshop;
1992 Oct 25; Pittsburgh, PA. Medford (NJ): Learned Information; 1993. p.
15-35. Capturing and exploiting textual database associations has played a
pivotal role in the evolution of automated information systems. A variety
of statistical, linguistic and artificial intelligence approaches have
been described in the literature. Many of these R&amp;D concepts and
techniques are now being incorporated into commercially available search
systems and services. This paper discusses prior work and reports on
research in progress aimed at creating and utilizing a global semantic
associative database, AURA (Associative User Retrieval Aid), to facilitate
machine-assisted indexing, classification and searching in the large-scale
information processing environment of NLM's core bibliographic databases,
MEDLINE and CATLINE. AURA is a semantic network of over two million
natural language phrases derived from more than a million MEDLINE titles.
These natural language phrases are associatively linked to NLM's MeSH
(Medical Subject Headings) and UMLS (Unified Medical Language System)
metathesaurus controlled vocabulary and classification resources.
Reproduced with permission of the American Society for Information
Science.</P>
<P>Harbourt AM, Syed EJ, Hole WT, Kingsland LC 3d. The ranking algorithm
of the Coach browser for the UMLS metathesaurus. Proc Annu Symp Comput
Appl Med Care 1993:720-4. This paper presents the novel ranking algorithm
of the Coach Metathesaurus browser which is a major module of the Coach
expert search refinement program. An example shows how the ranking
algorithm can assist in creating a list of candidate terms useful in
augmenting a suboptimal Grateful Med search of MEDLINE. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Hersh WR. Evaluation of Meta-1 for a concept-based approach to the
automated indexing and retrieval of bibliographic and full-text databases.
Med Decis Making 1991 Oct-Dec;11(4 Suppl):S120-4. SAPHIRE is a
concept-based approach to information retrieval in the biomedical domain.
Indexing and retrieval are based on a concept-matching algorithm that
processes free text to identify concepts and map them to their canonical
form. This process requires a large vocabulary containing a breadth of
medical concepts and a diversity of synonym forms, which is provided by
the Meta-1 vocabulary from the Unified Medical Language System Project of
the National Library of Medicine. This paper describes the use of Meta-1
in SAPHIRE and an evaluation of both entities in the context of an
information retrieval study. Copyright 1991 Hanley and Belfus.</P>
<P>Hersh WR, Hickam DH. A comparative analysis of retrieval effectiveness
for three methods of indexing AIDS-related abstracts. In: Proceedings of
the 54th Annual Meeting of the American Society for Information Science;
1991 Oct 27-31; Washington, DC. Medford (NJ): Learned Information; 1991.
p. 211-25. SAPHIRE is an experimental information retrieval system
featuring concept-based automated indexing and natural language input,
relevance-based retrieval. This experiment evaluates SAPHIRE'S indexing
capability in a three-way comparison of retrieval effectiveness versus
traditional MEDLINE indexing and title-abstract word indexing. SAPHIRE's
recall and precision values are inferior to both methods in a
MEDLINE-style Boolean searching environment, although additional
experiments suggest that better retrieval performance is obtained when
SAPHIRE's natural language input and relevance ranking features are
used.</P>
<P>Hersh WR, Hickam DH. A comparison of retrieval effectiveness for three
methods of indexing medical literature. Am J Med Sci 1992
May;303(5):292-300. Conventional approaches to indexing medical literature
include the human assignment of terms from a controlled vocabulary, such
as MeSH, or the computer assignment of all words in the title and abstract
as indexing terms. Human indexing suffers from inconsistency, while
word-based indexing suffers from the multiple meanings of words. SAPHIRE
is a computer program designed to provide indexing using controlled terms
that are assigned by computer, based on their occurrence in the title and
abstract. In this first evaluation of SAPHIRE, the authors compared the
retrieval performance of the three indexing approaches--human-based
MEDLINE with text words; machine-based SAPHIRE with text words; and text
words only--for searches by measuring recall and precision for each search
using a test collection of 200 abstracts. The abstracts were judged by
human reviewers for relevance as applied to 12 literature queries. The
results suggest that text word indexing is more effective than indexing
with MeSH terms. SAPHIRE's indexing performance was slightly inferior but
the program has other advantageous features. Copyright Southern Society
for Clinical Investigation; published by Lippincott-Raven Publishers.</P>
<P>Hersh WR, Hickam DH. A comparison of two methods for indexing and
retrieval from a full-text medical database. Med Decis Making 1993
Jul-Sep;13(3):220-6. The objective of this study was to compare how well
medical professionals are able to retrieve relevant literature references
using two computerized literature searching systems that provide automated
(non-human) indexing of content. The first program was SAPHIRE, which
features concept-based indexing, free-text input of queries, and ranking
of retrieved references for relevance. The second program was SWORD, which
provides single-word searching using Boolean operators (AND, OR). Sixteen
fourth-year medical students participated in the study. The database for
searching was six volumes from the 1989 Yearbook series. The queries were
ten questions generated on teaching rounds. All subjects searched half the
queries with each program. After the searching, each subject was given a
questionnaire about prior experience and preferences about the two
programs . Recall (proportion of relevant articles retrieved from the
database) and precision (proportion of relevant articles in the retrieved
set) were measured for each search done by each participant. Mean recall
was 57.6% with SAPHIRE; it was 58.6% with SWORD. Precision was 48.1% with
SAPHIRE vs 57.6% with SWORD. Each program was rated easier to use than the
other by half of the searchers, and preferences were associated with
better searching performance for that program. Both systems achieved
recall and precision comparable to existing systems and may represent
effective alternatives to MEDLINE and other retrieval systems based on
human indexing for searching medical literature. Copyright 1993 Hanley and
Belfus.</P>
<P>Hersh WR, Hickam DH. An evaluation of interactive boolean and natural
language searching with an online medical textbook. J Am Soc Inf Sci 1995
Aug;46(7):478-89. Few studies have compared the interactive use of Boolean
and natural language searching systems. We studied the use of three
retrieval systems by senior medical students searching on queries
generated by actual physicians in a clinical setting. The searchers were
randomized to search on two of three different retrieval systems: a
Boolean system, a word-based natural language system, and a concept-based
natural language system. Our results showed no statistically significant
differences in recall or precision among the three systems. Likewise, we
found no user preference for any system over the others. In the course of
this study we did find, however, a number of problems with traditional
measures of retrieval evaluation when applied to the interactive search
setting. Copyright 1995 by and reproduced with permission of John Wiley
and Sons. </P>
<P>Hersh WR, Hickam DH, Leone TJ. Words, concepts, or both: optimal
indexing units for automated information retrieval. Proc Annu Symp Comput
Appl Med Care 1992:644-8. What is the best way to represent the content of
documents in an information retrieval system? This study compares the
retrieval effectiveness of five different methods for automated
(machine-assigned) indexing using three test collections. The consistently
best methods are those that use indexing based on the words that occur in
the available text of each document. Methods used to map text into
concepts from a controlled vocabulary showed no advantage over the
word-based methods. This study also looked at an approach to relevance
feedback which showed benefit for both word-based and concept-based
methods. Copyright by and reprinted with permission by the American
Medical Informatics Association.</P>
<P>Jenders RA, Estey G, Martin M, Hamilton G, Ford-Carleton P, Thompson
BT, Oliver DE, Eccles R, Barnett GO, Zielstorff RD, et al. Indexing
guidelines: applications in use of pulmonary artery catheters and pressure
ulcer prevention. Proc Annu Symp Comput Appl Med Care 1994:802-6. In a
busy clinical environment, access to knowledge must be rapid and specific
to the clinical query at hand. This requires indices which support easy
navigation within a knowledge source. We have developed a computer-based
tool for trouble-shooting pulmonary artery waveforms using a graphical
index. Preliminary results of domain knowledge tests for a group of
clinicians exposed to the system (N = 33) show a mean improvement on a
30-point test of 5.33 (p &lt; 0.001) compared to a control group (N = 19)
improvement of 0.47 (p = 0.61). Survey of the experimental group (N = 25)
showed 84% (p = 0.001) found the system easy to use. We discuss lessons
learned in indexing this domain area to computer-based indexing of
guidelines for pressure ulcer prevention. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Merz RB, Cimino C, Barnett GO, Blewett DR, Gnassi JA, Grundmeier R,
Hassan L. A pre-search estimation algorithm for MEDLINE strategies with
qualifiers. Proc Annu Symp Comput Appl Med Care 1994:910-4. Inexperienced
users of online medical databases often have difficulty formulating their
queries. Systems designed to assist them usually do not estimate how
effective the initial search strategy will be before performing an actual
search. Consequently, the search may find an overwhelming number of
citations, or retrieve nothing at all. We have developed an estimation
algorithm to predict the outcome of a MEDLINE search. The portion of the
algorithm described here estimates retrieval for strategies containing
qualifiers. In test searches, the estimate reduced the trial-and-error of
strategy formulation. However, the accuracy of the estimate fell short of
expectations. Our results show that pre-search estimation for strategies
with qualifiers cannot be performed effectively with only the occurrence
data that is presently available. They further imply that automated search
intermediaries can benefit from medical knowledge which expresses the
relationships that exist between terms. Copyright by and reprinted with
permission of the American Medical Informatics Association. </P>
<P>Richwine PW. A study of MeSH and UMLS for subject searching in an
online catalog. Bull Med Libr Assoc 1993 Apr;81(2):229-33.</P>
<P>Rindflesch TC, Aronson AR. Semantic processing in information
retrieval. Proc Annu Symp Comput Appl Med Care 1993:611-5. Intuition
suggests that one way to enhance the information retrieval process would
be the use of phrases to characterize the contents of text. A number of
researchers, however, have noted that phrases alone do not improve
retrieval effectiveness. In this paper we briefly review the use of
phrases in information retrieval and then suggest extensions to this
paradigm using semantic information. We claim that semantic processing,
which can be viewed as expressing relations between the concepts
represented by phrases, will in fact enhance retrieval effectiveness. The
availability of the UMLS domain model, which we exploit extensively,
significantly contributes to the feasibility of this processing. Copyright
by and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Robert JJ, Joubert M, Nal L, Fieschi M. A computational model of
information retrieval with UMLS. Proc Annu Symp Comput Appl Med Care
1994:167-71. A high level representation of data would clarify the complex
collection of medical concepts, terms and relationships derived from
standard classifications that the Unified Medical Language System
contains. A conceptual model is described which represents the data
structure. A second objective of this conceptual model is to provide users
with the capability to build queries to information databases as easily as
possible on the basis of this data structure. The methods used to build
this model are semantic networks and conceptual graphs. The
object-oriented computational model which implements this conceptual model
is detailed. It reuses part of the generic C++ classes of the National
Institutes of Health library. New classes are added to this library to
implement the needed functionalities. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Yang Y, Chute CG. Words or concepts: the features of indexing units and
their optimal use in information retrieval. Proc Annu Symp Comput Appl Med
Care 1993:685-9. Words or Concepts, which are a better choice for indexing
the contents of documents? The answer depends on what method is used for
retrieval. This paper studies the effects of using canonical concepts
versus document words in different retrieval systems with a testing
collection of MEDLINE documents. In our tests, for a retrieval system
which does not use any human knowledge, using words yielded better
retrieval results, while using concepts suffered from a vocabulary
difference between canonical expressions of concepts and non-canonical
words in queries or documents. For a system which depends on the UMLS
synonym set for a mapping from queries or documents to canonical concepts,
the retrieval results were slightly better than the case of not using the
synonyms, but still worse than the systems using words. For the systems
which automatically learn empirical connections between words and concepts
from examples in the testing collection, the vocabulary problem was
effectively solved, and the results of using concepts were competitive or
better, compared to those using words. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI>
<UL>
<LI><STRONG><A name=3h>Information Retrieval
Systems</A></STRONG><BR></LI></UL></LI></UL>
<HR>
<P>Hersh W, Hickam D. Information retrieval in medicine: the SAPHIRE
experience. Medinfo 1995;8(Pt 2):1433-7. Information retrieval systems are
proliferating in biomedical settings, but many problems in indexing,
retrieval, and evaluation of systems continue to exist. The SAPHIRE
Project was undertaken to seek solutions to these problems. This paper
summarizes the evaluation studies that have been done with SAPHIRE,
highlighting the lessons learned and laying out the challenges ahead to
all medical information retrieval efforts.</P>
<P>Hersh W, Hickam DH, Haynes RB, McKibbon KA. Evaluation of SAPHIRE: an
automated approach to indexing and retrieving medical literature. Proc
Annu Symp Comput Appl Med Care 1991:808-12. An analysis of SAPHIRE, an
experimental information retrieval system featuring automated indexing and
natural language retrieval, was performed on MEDLINE references using data
previously generated for a MEDLINE evaluation. Compared with searches
performed by novice and expert physicians using MEDLINE, SAPHIRE achieved
comparable recall and precision. While its combined recall and precision
performance did not equal the level of librarians, SAPHIRE did achieve a
significantly higher level of absolute recall. SAPHIRE has other potential
advantages over existing MEDLINE systems. Its natural language interface
does not require knowledge of MeSH, and it provides relevance ranking of
retrieved references. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Hersh W, Leone TJ. The SAPHIRE server: a new algorithm and
implementation. Proc Annu Symp Comput Appl Med Care 1995:858-62. SAPHIRE
is an experimental information retrieval system implemented to test new
approaches to automated indexing and retrieval of medical documents. Due
to limitations in its original concept-matching algorithm, a modified
algorithm has been implemented which allows greater flexibility in partial
matching and different word order within concepts. With the concomitant
growth in client-server applications and the Internet in general, the new
algorithm has been implemented as a server that can be accessed via other
applications on the Internet. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Hersh WR, Greenes RA. SAPHIRE--an information retrieval system
featuring concept matching, automatic indexing, probabilistic retrieval,
and hierarchical relationships. Comput Biomed Res 1990 Oct;23(5):410-25.
SAPHIRE (Semantic and Probabilistic Heuristic Information Retrieval
Environment) is an experimental computer program designed to test new
techniques in automated information retrieval in the biomedical domain. A
main feature of the program is a concept-finding algorithm that processes
free text to find canonical concepts. The algorithm is designed to handle
a wide variety of synonyms and convert them to canonical form. This allows
natural language to be used for query input and also serves as the basis
for a new approach to automatic indexing based on a combination of
probabilistic and linguistic methods. Copyright 1990 Academic Press.</P>
<P>Hersh WR, Hickam D. Information retrieval in medicine. The SAPHIRE
experience. J Am Soc Inf Sci 1995 Dec;46(10):743-7. Information retrieval
systems are being used increasingly in biomedical settings, but many
problems still exist in indexing, retrieval, and evaluation. The SAPHIRE
Project was undertaken to seek solutions for these problems. This article
summarizes the evaluation studies that have been done with SAPHIRE,
highlighting the lessons learned and laying out the challenges ahead to
all medical information retrieval efforts. Copyright 1995 by and
reproduced with permission of John Wiley and Sons.</P>
<P>Hersh WR, Hickam DH, Haynes RB, McKibbon KA. A performance and failure
analysis of SAPHIRE with a MEDLINE test collection. J Am Med Inform Assoc
1994 Jan-Feb;1(1):51-60. OBJECTIVE: Assess the performance of the SAPHIRE
automated information retrieval system. DESIGN: Comparative study of
automated and human searching of a MEDLINE test collection. MEASUREMENTS:
Recall and precision of SAPHIRE were compared with those attributes of
novice physicians, expert physicians, and librarians for a test collection
of 75 queries and 2,334 citations. Failure analysis assessed the efficacy
of the Metathesaurus as a concept vocabulary; the reasons for retrieval of
nonrelevant articles and nonretrieval of relevant articles; and the effect
of changing the weighting formula for relevance ranking of retrieved
articles. RESULTS: Recall and precision of SAPHIRE were comparable to
those of both physician groups, but less than those of librarians.
CONCLUSION: The current version of the Metathesaurus, as utilized by
SAPHIRE, was unable to represent the conceptual content of one-fourth of
physician-generated MEDLINE queries. The most likely cause for retrieval
of nonrelevant articles was the presence of some or all of the search
terms in the article, with frequencies high enough to lead to retrieval.
The most likely cause for nonretrieval of relevant articles was the
absence of the actual terms from the query, with synonyms or
hierarchically related terms present instead. There were significant
variations in performance when SAPHIRE's concept-weighing formulas were
modified. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Hersh WR, Pattison-Gordon E, Evans DA. Adaption of Meta-1 for SAPHIRE,
a general purpose information retrieval system. Proc Annu Symp Comput Appl
Med Care 1990:156-60. The Unified Medical Language Systems Project (UMLS)
of the National Library of Medicine (NLM) has produced Meta-1, a
metathesaurus featuring over 40000 concepts and their synonyms from
several commonly-used medical vocabularies. The authors have adapted
Meta-1 for use in SAPHIRE, an information retrieval system featuring
automated indexing and probabilistic retrieval. They have also built
DESYGNS, a semantic network system designed to contain Meta-1 concepts
along with their sematic relationships. Future plans include improved
concept matching, improved indexing capability, and the use of semantic
relationships. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Jachna JS, Powsner SM, Miller PL. Augmenting GRATEFUL MED with the UMLS
Metathesaurus: an initial evaluation. Bull Med Libr Assoc 1993
Jan;81(1):20-8. Clinicians in patient care settings must be able to locate
relevant recent medical literature quickly. Computer literacy is
increasing, but many clinicians remain ill at ease with search strategies
for online bibliographic databases. As part of an ongoing project to
simplify the translation of clinical questions into effective searches, a
Unified Medical Language System (UMLS) Metathesaurus tool was designed.
The authors compared bibliographic searches by relatively inexperienced
users employing only GRATEFUL MED to searches done using GRATEFUL MED
augmented with this tool. The users were clinicians examining questions
related to a test set of clinical cases. Their problems and successes were
monitored; the results suggest that the addition of a thesaurus helps
resolve some problems in citation retrieval that trouble the novice user.
By helping the user understand indexing terms in context and by reducing
typing errors, a thesaurus can help provide an intelligent solution to
lexical mismatches in bibliographic retrieval. Copyright by and reprinted
with permission of the Medical Library Association.</P>
<P>Joubert M, Riouall D, Fieschi M, Botti G, Proudhon H. Contextual aids
for medical information retrieval. Medinfo 1992;7(Pt 2):1522-7. The paper
presents the first results of a work that the authors began in 1990. This
research work concerns the representation and use of medical concepts in
medical information management. Customisation of the user interfaces and
management of users contexts are addressed. These capabilities enhance the
material furnished by UMLS.</P>
<P>Kingsland LC 3d, Harbourt AM, Syed EJ, Schuyler PL. Coach: applying
UMLS knowledge sources in an expert searcher environment. Bull Med Libr
Assoc 1993 Apr;81(2):178-83. With the development of the Unified Medical
Language System (UMLS) Knowledge Sources, the National Library of Medicine
(NLM) has produced a resource of great potential for improving the
searching of MEDLINE. The Coach expert searcher system, an inhouse
research project at NLM, is designed to help users of the GRATEFUL MED
front-end software improve MEDLINE search and retrieval capabilities. This
paper describes the Coach program, the knowledge sources it uses, and some
of the ways it applies elements of the UMLS Metathesaurus to facilitate
access to the biomedical literature. Copyright by and reprinted with
permission of the Medical Library Association.</P>
<P>Kingsland LC 3d, Syed EJ, Lindberg DA. Coach: an expert searcher
program to assist Grateful Med users searching MEDLINE. Medinfo 1992;7(Pt
1):382-6. The Coach expert searcher system is being developed as an
in-house research project at the USA National Library of Medicine (NLM).
It brings to bear the Unified Medical Language System (UMLS) Metathesaurus
and ten additional knowledge sources to assist Grateful Med users seeking
help in improving retrieval from the ELHILL mainframe retrieval engine.
Initial work has concentrated on MEDLINE and its backfiles, and in
particular on the problem of null retrieval. Subsequent functions will
address searching problems relevant to other MEDLARS files. Coach offers
true ELHILL multifile searches, ELHILL sorting of output citations before
download, and considerable flexibility in the print format of downloaded
results. It works interactively with the user, with Grateful Med and with
ELHILL.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=3i>Linking Clinical Systems to Knowledge-based
Information Sources</A></STRONG><BR></LI></UL>
<HR>
<P>Cimino JJ. Linking patient information systems to bibliographic
resources. Methods Inf Med 1996 Jun;35(2):122-6. Medical informatics
researchers have explored a number of ways to integrate medical
information resources into patient care systems. Particular attention has
been given to the integration of on-line bibliographic resources. This
paper presents an information model which breaks down the integration task
into three components, each of which answers a question: what is the
user's question?, where can the answer be found?, and how is the retrieval
strategy composed? Twelve experimental systems are reviewed and their
methods for addressing one or more of these questions are described. </P>
<P>Cimino JJ, Aguirre A, Johnson SB, Peng P. Generic queries for meeting
clinical information needs. Bull Med Libr Assoc 1993 Apr;81(2):195-206.
This paper describes a model for automated information retrieval in which
questions posed by clinical users are analyzed to establish common
syntactic and semantic patterns. The patterns are used to develop a set of
general-purpose questions called generic queries. These generic queries
are used in responding to specific clinical information needs. Users
select generic queries in one of two ways. The user may type in questions,
which are then analyzed, using natural language processing techniques, to
identify the most relevant generic query; or the user may indicate patient
data of interest and then pick one of several potentially relevant
questions. Once the query and medical concepts have been determined, an
information source is selected automatically, a retrieval strategy is
composed and executed, and the results are sorted and filtered for
presentation to the user. This work makes extensive use of the National
Library of Medicine's Unified Medical Language System (UMLS): medical
concepts are derived from the Metathesaurus, medical queries are based on
semantic relations drawn from the UMLS Semantic Network, and automated
source selection makes use of the Information Sources Map. The paper
describes research currently under way to implement this model and reports
on experience and results to date. Copyright by and reprinted with
permission of the Medical Library Association.</P>
<P>Cimino JJ, Johnson SB, Aguirre A, Roderer N, Clayton PD. The MEDLINE
Button. Proc Annu Symp Comput Appl Med Care 1992:81-5. We have developed a
computerized method for performing bibliographic searches directly from
patient data involving five steps: 1) identifying specific patient data
which raises a question in the mind of the user, 2) selection (from a list
of generic questions) of a small number of questions which fit the
selected patient data, 3) automated translation of the patient data into
appropriate terms used for bibliographic indexing, 4) conversion of the
question selected by the user into a search strategy, and 5) transfer of
the search strategy to a search engine for a bibliographic database. We
have modified the Columbia-Presbyterian Clinical Information System to
experiment with this method. The first implementation converts patient
diagnoses and procedures coded in ICD9-CM into Medical Subject Headings
(MeSH) and searches Medline using BRS/Onsite. Challenges include
development of a useful set of generic questions and translation from
ICD9-CM to MeSH using the Unified Medical Language System (UMLS).
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Cimino JJ, Johnson SB, Peng P, Aguirre A. From ICD9-CM to MeSH using
the UMLS: a how-to guide. Proc Annu Symp Comput Appl Med Care 1993:730-4.
One purpose of the Unified Medical Language System (UMLS) is to facilitate
conversion of terms from one controlled medical vocabulary to another. We
examined our ability to convert International Classification of Diseases,
9th Edition, Clinical Modifications (ICD9-CM) to Medical Subject Headings
(MeSH) using the UMLS. We describe a method which mapped 30.4% of ICD9-CM
to UMLS. Of these, 95.0% were linked to MeSH, of which translation was
straightforward in 90.4%. We discuss the use of these translations for
retrieval from MeSH-indexed databases, such as Medline. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Cimino JJ, Sideli RV. Using the UMLS to bring the library to the
bedside. Med Decis Making 1991 Oct-Dec;11(4 Suppl):S116-20. This paper
presents an algorithm that can be used to convert ICD9 terms to related
MeSH terms. Preliminary evaluation indicates that together, the algorithm
and the UMLS provide a reasonable resource for facilitating such
conversions. Copyright 1991 Hanley and Belfus.</P>
<P>Lowe HJ, Walker WK, Polonkey Se, Jiang F, Vries JK, McCray AT. The
image engine HPCC project: a medical digital library system using
agent-based technology to create an integrated view of the electronic
medical record. In: Adam N, Halem M, Yesha Y, editors. Proceedings of the
3rd Forum on Research and Technology Advances in Digital Libraries, ADL
'96. Los Alamitos: IEEE Computer Society Press; 1996. p. 45-56.</P>
<P>Merz RB, Cimino C, Barnett GO, Blewett DR, Gnassi JA, Grundmeier R,
Hassan L. Q &amp; A: a query formulation assistant. Proc Annu Symp Comput
Appl Med Care 1993:498-502. Inexperienced users of online medical
databases often do not know how to formulate their queries for effective
searches. Previous attempts to help them have provided some standard
procedures for query formulation, but depend on the user to enter the
concepts of a query properly so that the correct search strategy will be
formed. Intelligent assistance specific to a particular query often is not
given. Several systems do refine the initial strategy based on relevance
feedback but usually do not make an effort to determine how well-formed a
query is before actually performing the search. As part of the Interactive
Query Workstation (IQW), we have developed an expert system, Questions and
Answers (Q&amp;A), that assists in formulating an initial strategy given
concepts entered by the user and that determines if the strategy is
well-formed, refining it when necessary. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Miller PL, Frawley SJ. Trade-offs in producing patient-specific
recommendations from a computer-based clinical guideline: a case study. J
Am Med Inform Assoc 1995 Jul-Aug;2(4):238-42. This case study explored 1)
how much online clinical data is required to obtain patient-specific
recommendations from a computer-based clinical practice guideline, 2)
whether the availability of increasing amounts of online clinical data
might allow a higher specificity of those recommendations, and 3) whether
that increased specificity is necessarily desirable. The "quick reference
guide" version of the guideline for acute postoperative pain management in
adults, developed by the Agency for Health Care Policy and Research, was
analyzed. Patient-specific data items that might be used to tailor the
computer's output for a particular case were grouped into rough categories
depending on how likely they were to be available online and how readily
they might be determined from online clinical data. The patient-specific
recommendations were analyzed to determine to what degree the amount of
text produced depended on the online availability of different categories
of data. An examination of example recommendations, however, illustrated
that high specificity may not always be desirable. The study provides a
concrete illustration of how the richness of online clinical data can
affect patient-specific recommendations, and describes a number of related
design trade-offs in converting a clinical guideline into an interactive,
computer-based form. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Miller RA, Gieszczykiewicz FM, Vries JK, Cooper GF. CHARTLINE:
providing bibliographic references relevant to patient charts using the
UMLS Metathesaurus Knowledge Sources. Proc Annu Symp Comput Appl Med Care
1992:86-90. A successful medical informatics program helps its users to
match their information needs as closely and efficiently as possible to
the capabilities of the system. CHARTLINE is a computer program whose
input is a free text, natural language patient chart in ASCII format.
Using the UMLS Metathesaurus Knowledge Sources, CHARTLINE can suggest
bibliographic references relevant to the patient case described in the
chart. The program does not attempt to understand the natural language
content of the chart. CHARTLINE only recognizes UMLS Metathesaurus Main
Concept terms (or their synonyms) as they occur in the medical text, since
those terms represent the tokens used to index the literature. The program
depends on user feedback to determine which topics of a large number of
potentially relevant subjects are of interest to the user. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Nelson SJ, Sherertz DD, Tuttle MS. Issues in the development of an
information retrieval system: the Physician's Information Assistant.
Medinfo 1992;7(Pt 1):371-5. There are many models of electronic
information retrieval systems. The diversity of these systems, each
requiring the user to learn new and idiosyncratic operating methods, is
inhibiting to the user. In an effort to find a useful set of conventions
of information organization and user navigation, the authors have
developed the Physician's Information System (PIA). The model is that of a
hypertext browser which reflects an assessment of the manner a user is
most likely to approach the knowledge (the user model). The PIA uses
existing knowledge bases and resources, including a semantic network
browser and a communications program which handles literature searches,
and achieves interoperability over these multiple resources. Browsing
allows a wide variety of cognitive styles and supports answering
poorly-formed queries. The user must exercise judgment in determining if
the information found is relevant to the clinical situation. Difficulties
with large volumes of text on a CRT screen can occur; nontextual visual
representations of information, such as maps, appear to be helpful in
reducing the amount of text. The methodology used in building the PIA
appears to be adaptable to a variety of knowledge sources and other
resources. The consistent user metaphor provides an example of the type of
conventions that may be necessary to enable users to approach multiple
knowledge sources.</P>
<P>Nelson SJ, Sherertz DD, Tuttle MS, Abarbanel RA, Olson NE, Erlbaum MS,
Sperzel WD. The Physician's Information Assistant. Proc Annu Symp Comput
Appl Med Care 1991:950-2.</P>
<P>Patil RS, Silva JS, Swartout WR. An architecture for a health care
provider's workstation. Int J Biomed Comput 1994 Jan;34(1-4):285-99. This
paper presents an architecture for a health care provider's workstation
designed to assist health care providers in performing their daily
activities. The design is based on the concept of a clinician's associate
which acts as an intelligent intermediary between the provider and a
diverse collection of clinical, administrative, and educational
information sources. The architecture is designed to be hardware platform
independent, to work across different I/O capabilities, and to be open,
allowing specialized applications to be easily integrated with the system
and their functionality delivered through a common user environment.</P>
<P>Powsner SM, Miller PL. Automated online transition from the medical
record to the psychiatric literature. Methods Inf Med 1992
Sep;31(3):169-74. Psych Topix is a knowledge-based program which guides
the clinician from an on-line clinical report to a search of the
psychiatric literature or of other relevant databases. It provides this
guidance by using an outline of key topics in a clinical field to provide
"concept-based" links. Each topic is augmented with an activation
expression to signal when that topic is potentially relevant to a case,
and with database search expressions to allow focused retrieval of
information. The bibliographic retrieval component of Psych Topix is
currently operational as part of the daily, routine operation of a
psychiatric consultation service. The system is also implemented in a
demonstration mode to provide retrieval from three additional textual
databases. The current Psych Topix system provides a working demonstration
of the clinical feasibility of using concept-based links to facilitate the
focused, automated transition between on-line medical databases.</P>
<P>Powsner SM, Miller PL. From patient reports to bibliographic retrieval:
a Meta-1 front-end. Proc Annu Symp Comput Appl Med Care 1991:526-30. A
software front-end has been programmed to help construct Medline query
expressions from selected text in clinical records. The user clicks to
choose pertinent words or phrases from the text with a pointing device and
the words are translated into Medical Subject Headings (MeSH). The
National Library of Medicine's Unified Medical Language System Meta-1
Thesaurus is used to look up the words selected by the user. The software
traces through chains of synonyms to assemble a small set of MeSH indexing
terms. The user then makes the final selection from among the MeSH terms
and combines chosen terms using logical connectives to form a Medline
query which is passed on to Grateful Med. This approach provides the
clinical user with a natural starting point, the text of a patient report
with no need to know the MeSH terminology. The software handles the
translation that otherwise would necessitate looking up terms in MeSH
guidebooks, as well as handling the added drudgery of checking out
different synonyms. Preliminary evaluation of this approach with clinical
trainees indicated that they find the front-end a straightforward way to
search for literature relevant to a clinical case. Having a tool for
immediate translation from clinical terminology to indexing terminology
seems to be an important factor. Apparently minor issues in interface
design, such as keeping the clinical report displayed simultaneously along
with the search under construction, and keeping both visible during the
search itself seem to help orient the user. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Powsner SM, Miller PL. Linking bibliographic retrieval to clinical
reports. PsychTopix. Proc Annu Symp Comput Appl Med Care 1989:431-5.
PsychTopix is an expert system which guides the clinician from a computer
based clinical record to a focused bibliographic retrieval. Specifically,
PsychTopix searches the literature for references pertinent to a
psychiatric consultation report. It provides intelligent guidance by
drawing on a knowledge base of current issues in psychiatry. It scans the
report to determine which clinical topics (issues) are likely to be
relevant to the case. The clinician then selects those topics for which he
or she desires a literature search. There is no need for the user to know
the mechanics or protocols of computerized literature retrieval.
PsychTopix initiates a Medline search and presents the references
retrieved to the user. More generally, PsychTopix provides an effective
demonstration of the key topics approach to medical database linkage.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Powsner SM, Riely CA, Barwick KW, Morrow JS, Miller PL. Automated
bibliographic retrieval based on current topics in hepatology: Hepatopix.
Comput Biomed Res 1989 Dec;22(6):552-64. The Hepatopix computer program
helps the physician go from a computerized clinical record directly to a
computerized search of the medical literature. The program uses a
hierarchical list of current (key) topics in hepatology to offer
"intelligent" searches. Each topic has associated "selection logic" and a
tested Medline search. Starting with a liver biopsy case record, Hepatopix
evaluates the selection logic to determine which topics may be pertinent
to the case (based on clinical findings, lab tests, and critical words or
phrases in the summary). The physician then picks those topics which are
interesting enough to warrant a literature search. The citations are
retrieved using search strategies stored for each topic and presented.
Hepatopix is operational with over 200 topics in the realm of liver
neoplasms, operating on liver biopsy case summaries from the Klatskin
Database of Liver Biopsies. Besides demonstrating clinical case-directed
bibliographic retrieval, it demonstrates the utility of a "key topics"
list as a bridge between medical databases. Copyright 1989 Academic
Press.</P>
<P>Sherertz DD, Tuttle MS, Olson NE, Hsu GT, Carlson RW, Fagan LM, Acuff
RD, Cole WG, Nelson SJ. Accessing oncology information at the point of
care: experience using speech, pen, and 3-D interfaces with a knowledge
server. Medinfo 1995;8(Pt 1):792-5. Oncologists' information needs arise
at diverse times and settings. For example: Is superior vena cava syndrome
a medical emergency? Our collaborative group is developing a system that
supports an interface with combinations of spoken, gestural, and simulated
three-dimensional manipulation to help an oncologist focus on the
information need, not the system. The system requires a small amount of
input from the oncologist, and then anticipates what information is
pertinent to the patient at hand, based on the sources it has available.
The system makes use of a Knowledge Server to find relevant information.
The Knowledge Server uses selected data for the particular patient from a
Computer-based Patient Record (CPR) to provide context for the information
needs. The Knowledge Server leverages the Unified Medical Language System
(UMLS) resources as well as relevant communications standards. A layered,
interaction protocol is used to help manage the fulfillment of information
needs. Each of the oncology knowledge sources is transformed into a
uniform representation that utilizes both its formal schema (e.g., its
table of contents) and its concepts and words indexed through the UMLS
Metathesaurus. Our focus on the appropriate use of information from a CPR,
and on anticipating oncologists' information needs, resulted from our
study of several longitudinal patient scenarios. We believe that our use
of scenario-based design techniques will help to ensure the system's
success.</P>
<P>Tuttle MS, Sherertz DD, Fagan LM, Carlson RW, Cole WG, Schipma PB,
Nelson SJ. Toward an interim standard for patient-centered
knowledge-access. Proc Annu Symp Comput Appl Med Care 1993:564-8. Most
care-giver knowledge needs arise at the point of care and are
patient-centered. Many of these knowledge needs can be met using existing
on-line knowledge sources, but the process is too time-consuming,
currently, for even the computer-proficient. We are developing a set of
public domain standards aimed at bringing potentially relevant knowledge
to the point of care in a straight-forward and timely fashion. The
standards will a) make use of selected items from a Computer-based Patient
Record (CPR), e.g., a diagnosis and measure of severity, b) anticipate
certain care-giver knowledge needs, e.g., therapy, protocols,
complications, and c) try to satisfy those needs from available knowledge
sources, e.g., knowledge-bases, citation databases, practice guidelines,
and on-line textbooks. The standards will use templates, i.e.,
fill-in-the-blank structures, to anticipate knowledge needs and UMLS
Metathesaurus enhancements to represent the content of knowledge sources.
Together, the standards will form the specification for a Knowledge-Server
(KS) designed to be accessed from any CPR system. Plans are in place to
test an interim version of this specification in the context of medical
oncology. We are accumulating anecdotal evidence that a KS operating in
conjunction with a CPR is much more compelling to users than either a CPR
or a KS operating alone. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Tuttle MS, Sherertz DD, Olson NE, Nelson SJ, Erlbaum MS, Keck KD, Davis
AN, Suarez-Munist ON, Lipow SS, Cole WG. Toward reusable software
components at the point of care. Proc AMIA Fall Symp 1996:150-4. An
architecture built from five software components -- a Router, Parser,
Matcher, Mapper, and Server -- fulfills key requirements common to several
point-of-care information and knowledge processing tasks. The requirements
include problem-list creation, exploiting the contents of the Electronic
Medical Record for the patient at hand, knowledge access, and support for
semantic visualization and software agents. The components use the
National Library of Medicine Unified Medical Language System to create and
exploit lexical closure -- a state in which terms, text and reference
models are represented explicitly and consistently. Preliminary versions
of the components are in use in an oncology knowledge server. Copyright by
and reprinted with permission of the American Medical Informatics
Association. </P>
<P>van Mulligen EM. UMLS-based access to CPR data. Proc AMIA Fall Symp
1996:819. This abstract describes the results of a project that explores
the use the Unified Medical Language System (UMLS) in browsing a
computer-based patient record (CPR)]. The project consisted of a number of
steps: the mapping between CPR terms and UMLS concepts, the development of
an algorithm that explores the CPR data using this mapping, and the
implementation of a first prototype browser that visualizes "found" data.
A second issue in this project has been the direct access to online
medical literature (MEDLINE) using the UMLS concepts found in the CPR
data. In this project, we used a preliminary version of the Open Records
for Patient Care (ORCA) CPR that consisted only of the history and
physical examination data of patients suffering from heart failure.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=3j>Access to Multiple Knowledge-based Information
Sources</A></STRONG><BR></LI></UL>
<HR>
<P>Barber S, Fowler J, Long KB, Dargahi R, Meyer B. Integrating the UMLS
into VNS retriever. Proc Annu Symp Comput Appl Med Care 1992:273-7. We are
developing a networked resource for the National Library of Medicine's
Unified Medical Language System. We call this resource the UMLS Retriever,
which is an instance of our VNS Retriever architecture. Our prototype user
interface makes use of the Virtual Notebook System Browser. The
development of a networked UMLS service will result in numerous advantages
to our user community. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Cimino C, Barnett GO. Standardizing access to computer-based medical
resources. Proc Annu Symp Comput Appl Med Care 1990:33-7. The paper
describes a working Interactive Query Workstation (IQW). The IQW allows
users to query multiple resources: a medical knowledge base (DXplain), a
clinical database (COSTAR/MQL), a bibliographic database (MEDLINE), a
cancer database (PDQ), and a drug interaction database (PDR). The IQW has
evolved from requiring alteration of resource code to using off-the-shelf
products (Kappa &amp; Microsoft Windows) to control resources.
Descriptions of each resource were developed to allow IQW to access these
resources. There are three components to these descriptions; information
on how data is sent and received from a resource, in formation on types of
queries to which a resource can respond, and information on what types of
information are needed to execute a query. These components form the basis
of a standard description of resources. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Cimino C, Barnett GO, Blewett DR, Hassan LJ, Grundmeier R, Merz R, Kahn
JA, Gnassi JA. Interactive query workstation: a demonstration of the
practical use of UMLS knowledge sources. Proc Annu Symp Comput Appl Med
Care 1992:823-4. The Interactive Query Workstation (IQW) has been
developed to provide clinicians with a uniform program interface for
retrieving medical-related information from various computer-based
information resources. These resources can vary in content (bibliographic
databases, drug information, general medical text databases), function
(article retrieval, differential diagnosis, drug interaction detection, or
drug dosage and administration information), and media formats (local hard
disk, CD-ROM, local area network, or distant telecommunication link). IQW
allows modular addition of new resources as well as extension of
previously installed resources. The National Library of Medicine's three
Unified Medical Language System (UMLS) Knowledge Sources, the
Metathesaurus (Meta), the Semantic Network, and the Information Sources
Map (ISM) have been incorporated into many aspects of IQW. Meta provides
information about medical terminology and aids IQW in isolating the basic
concepts from a clinician's question. The Semantic Network provides
information about the categorization of concepts and possible relations
between concepts. It also assists IQW in determining which queries are
appropriate for a set of concepts contained in the clinician's question.
The ISM provides information about the content available from a
computer-based resources and aids IQW in selecting an appropriate resource
from which to collect information. The computer-based resource selection
is performed without user intervention. This interactive demonstration
shows an environment which increases the accessibility of medical
information to clinicians by utilizing the three UMLS Knowledge Sources.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Cimino C, Barnett GO, Hassan L, Blewett DR, Piggins JL. Interactive
query workstation: standardizing access to computer-based medical
resources. Comput Methods Programs Biomed 1991 Aug;35(4):293-9. Methods of
using multiple computer-based medical resources efficiently have
previously required either the user to manage the choice of resource and
terms, or specialized programming. Standardized descriptions of what
resources can do and how they may be accessed would allow the creation of
an interface for multiple resources. This interface would assist a user in
formulating queries, accessing the resources and managing the results.
This paper describes a working prototype, the Interactive Query
Workstation (IQW). The IQW allows users to query multiple resources: a
medical knowledge base (DXplain), a clinical database (COSTAR/MQL), a
bibliographic database (MEDLINE), a cancer database (PDQ), and a drug
interaction database (PDR). Descriptions of each resource were developed
to allow IQW to access these resources. The descriptions are composed of
information on how data are sent and received from a resource, information
on types of query to which a resource can respond, and information on what
types of information are needed to execute a query. These components form
the basis of a standard description of resources.</P>
<P>Clyman JI, Powsner SM, Paton JA, Miller PL. Using a network menu and
the UMLS Information Sources Map to facilitate access to online reference
materials. Bull Med Libr Assoc 1993 Apr;81(2):207-16. As computer
technology advances, clinicians and biomedical researchers are becoming
more dependent upon information from online databases and information
systems. By using specially configured computer workstations and
high-speed computer networks, it is now possible to access this
information in a rapid and straightforward manner. To empower users by
providing these capabilities, the authors are assembling a variety of
network workstations to be located throughout Yale-New Haven Medical
Center. At the heart of the workstation is NetMenu, a program designed to
help users connect to a number of important online information systems,
including a hospital order entry and results reporting system, a drug
reference, bibliographic retrieval systems, and educational programs. In
addition, as part of the National Library of Medicine's Unified Medical
Language System (UMLS) project, the authors have developed a local
prototype of the UMLS Information Sources Map (ISM) and a companion query
assistant program to complement the NetMenu in helping users select and
connect automatically to information services relevant to a particular
question. The ISM query assistant draws from a listing of many online
information sources accessible via local and international networks.
Copyright by and reprinted with permission of the Medical Library
Association.</P>
<P>Dolin RH. Internet medical resources [letter]. Ann Intern Med 1996 Feb
1;124(3):375. Comment on: Ann Intern Med 1995 Jul 15;123(2):123-31.</P>
<P>Freiburger G, Levy SR, LePoer PM, Murray J, Heinold S, Warfield T. UMLS
workstation project. Progress to date. Proc Annu Symp Comput Appl Med Care
1993:877. In 1992, the Health Science Library at the University of
Maryland was awarded a three-year grant from the National Library of
Medicine to create a Windows-based interface to the Unified Medical
Language System (UMLS). This interface will use the UMLS Knowledge Sources
to assist users searching various databases available at the Library,
including the online catalog, PsycLIT, CINAHL, MEDLINE, and HSL Current
Contents. This paper traces the evolution of the interface during its
first 18 months by illustrating the revisions made to the prototype.
Revisions are based on user feedback elicited in an iterative process of
design, development, and review. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Gnassi JA, Barnett GO. A survey of electronic drug information
resources and identification of problems associated with the differing
vocabularies used to key them. Proc Annu Symp Comput Appl Med Care
1994:631-5. Drug information resources are increasingly becoming
electronically available. They differ in scope, granularity, and purpose.
These considerations have shaped the selection of dissimilar drug name
keys, complicating access. An abbreviated and simplified historical
context of the development of official controlled vocabularies and their
relationships is followed by a review of the kinds of information
available in several electronic drug information resources. The key
vocabularies used are discussed with examples. Problems using the
differing terms of the resource vocabularies are identified. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Gnassi JA, Bormel JI, Blewett DR, Kim RJ, Barnett GO. A medical
information resource server: one stop shopping on the Internet. Proc Annu
Symp Comput Appl Med Care 1994:1025.</P>
<P>Hersh WR, Brown KE, Donohoe LC, Campbell EM, Horacek AE. CliniWeb:
managing clinical information on the World Wide Web. J Am Med Inform Assoc
1996 Jul-Aug;3(4):273-80. The World Wide Web is a powerful new way to
deliver on-line clinical information, but several problems limit its value
to health care professionals: content is highly distributed and difficult
to find, clinical information is not separated from non-clinical
information, and the current Web technology is unable to support some
advanced retrieval capabilities. A system called CliniWeb has been
developed to address these problems. CliniWeb is an index to clinical
information on the World Wide Web, providing a browsing and searching
interface to clinical content at the level of the health care student or
provider. Its database contains a list of clinical information resources
on the Web that are indexed by terms from the Medical Subject Headings
disease tree and retrieved with the assistance of SAPHIRE. Limitations of
the processes used to build the database are discussed, together with
directions for future research. Copyright by and reprinted with permission
of the American Medical Informatics Association.</P>
<P>Loonsk JW, Lively R, TinHan E, Litt H. Implementing the Medical
Desktop: tools for the integration of independent information resources.
Proc Annu Symp Comput Appl Med Care 1991:574-7. The increasing
availability of medical information resources has moved the Medical
Desktop from a theoretical construct to a practical necessity. Many
micro-computers are becoming available in clinical and academic settings
that can access several medical information applications. These computers
are usually not powerful workstations that are part of a clinically
oriented information support system, but are personal computers with
varied capabilities. The applications on these computers come from
different sources, are accessed through different user interfaces and do
not share data well. The de facto Medical Desktop this situation presents
will discourage most end-users because the combination of applications is
complex, the applications are poorly integrated, and individual
applications are inconsistent. At the State University of New York at
Buffalo School of Medicine and Biomedical Sciences we have developed
several Microsoft Windows-based tools that accept a systems level
diversity of resources, but work toward the construction of a coherent
Medical Desktop. These tools include a lexical term linker, a resource
database, and a context sensitive help system that is tailored to locally
available resources. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Rodgers RP. Automated retrieval from multiple disparate information
sources. The World Wide Web and the NLM's Sourcerer project. J Am Soc Inf
Sci 1995 Dec;46(10):755-64. The burgeoning amount of information available
via the internet has heightened awareness of the need for improved tools
for resource identification. The U.S. National Library of Medicine's (NLM)
Sourcerer project is developing software which accepts a user query,
automatically identifies appropriate information resources, and
facilitates connection to those sources for information retrieval. The
current Sourcerer prototype utilizes the
multimedia/multiplatform/multiprotocol network-based hypertext system
known as World Wide Web. It also relies upon the knowledge sources of the
Unified Medical Language System (UMLS). The UMLS is the result of a
long-term project of NLM. It comprises a large Metathesaurus of biomedical
concepts (coupled with a semantic network and syntactical/lexical software
tools) and the information Sources Map (ISM), a database of records
describing specific biomedical information resources. Recent advances in
the standardization of information exchange over computer networks,
coupled with the tools provided by UMLS, facilitate query refinement and
augmentation, connection to resources, and retrieval from resources.
Daunting challenges remain with respect to optimizing resource
descriptions, defining optimal algorithms for searching for sources,
optimizing user interface design, and organizing retrieved information.
Copyright 1995 by and reproduced with permission of John Wiley and
Sons.</P>
<P>Sperzel WD, Abarbanel RM, Nelson SJ, Erlbaum MS, Sherertz DD, Tuttle
MS, Olson NE, Fuller LF. Biomedical database inter-connectivity: an
experiment linking MIM, GENBANK, and META-1 via MEDLINE. Proc Annu Symp
Comput Appl Med Care 1991:190-3. The linkage of disparate biomedical
databases is an important goal of the Unified Medical Language (UMLS)
Project. We conducted an experiment to investigate the feasibility of
using UMLS resources to link databases in clinical genetics and molecular
biology. References from MIM (Mendelian Inheritance in Man) were lexically
mapped to the equivalent citations in MEDLINE. The MeSH major subject
headings by which the citations in a particular MIM entry had been indexed
were used to develop a genetic-disorder-centered view of the world in
Meta-1 (the first official version of the UMLS Metathesaurus). Our
hypothesis was that these MeSH subject headings could provide access to a
semantic neighborhood in Meta-1 that would be relevant to a particular
genetic disorder. By browsing in this semantic neighborhood, a user could
select various combinations of terms with which to search MEDLINE through
an interface between Meta-1 and Grateful Med. Such searches might retrieve
citations that were more recent than those in MIM or that provided useful
supplementary information. Since some MEDLINE records contain pointers to
entries in GENBANK, information about genetic sequences related to a
particular clinical genetic disorder could also be retrieved. This
scenario was implemented for a small number of MIM entries, providing a
concrete demonstration that linking disparate electronic databases in an
important subdomain of biomedicine is relatively straightforward.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Tuttle MS, Cole WG, Sherertz DD, Nelson SJ. Navigating to knowledge.
Methods Inf Med 1995 Mar;34(1-2):214-31. One way to fulfill point-of-care
knowledge needs is to present caregivers with a visual representation of
the available "answers". Using such a representation, caregivers can
recognize what they want, rather than have to recall what they need, and
then navigate to an appropriate answer. Given selected pieces of
information from a computer-based patient record, an interface can
anticipate certain knowledge needs by initializing caregiver navigation in
a semantic neighbourhood on answers likely to be relevant to the patient a
hand. These notions draw heavily on two collaborative projects - the U.S.
National Library of Medicine Unified Medical Language System and the U.S.
National Cancer Institute Knowledge Server. Both these projects support
navigation because they make the structure of medical knowledge explicit
in a way that can be exploited by human interfaces.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H3>Preliminary and Ancillary Studies</H3>
<UL>
<LI><STRONG><A name=4a>User Information Needs</A></STRONG> </LI></UL>
<HR>
<P>Cimino C, Barnett GO. Analysis of physician questions in an ambulatory
care setting. Proc Annu Symp Comput Appl Med Care 1991:995-9. We collected
38 questions generated by physicians based on their active patient medical
records. Each question was associated with a single term in a specific
record (Key Term). These questions were analyzed with respect to word
content and concept content. Concepts were matched to the National Library
of Medicine's Metathesaurus (Meta-1). Thirty-seven Key Terms matched
completely to Meta-1 terms. Each question matched to an average of 4.1
Meta-1 terms for a total of 156 concepts. Based on word count, these 156
concepts accounted for 40 percent, stop words accounted for 39 percent,
and numbers and drug trade names accounted for less than 1 percent of the
words. The remaining 20 percent of the words could be matched to 69
concepts not in Meta-1. Review of all concepts showed that they could be
divided into medical terms (Noun Concepts), modifiers (Modifier Concepts),
and concepts that provided context for the questions (Relation Concepts).
The majority of Relation Concepts did not match to Meta-1. A vocabulary of
Relation Concepts would provide a useful starting point for a computer
system designed to aid physicians in answering clinical questions.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Cimino C, Barnett GO. Analysis of physician questions in an ambulatory
care setting. Comput Biomed Res 1992 Aug;25(4):366-73. We collected 69
questions generated by physicians based on their active patient medical
records. Each question was associated with a single term in a specific
record (Key Term). These questions were analyzed with respect to word
content and concept content. Concepts were matched to the National Library
of Medicine's Metathesaurus (Meta-1). Sixty-eight Key Terms were
completely matched by Meta-1 terms. Each question matched to an average of
3.7 Meta-1 terms for a total of 255 concepts. Based on word count, these
255 concepts accounted for 43%, stop words accounted for 36%, and numbers
and drug trade names accounted for 3% of the words. The remaining 18% of
the words could be matched to 143 concepts not in Meta-1. Review of all
concepts showed that they could be divided into medical terms (Noun
Concepts), modifiers (Modifier Concepts), and concepts that provided
context for the questions (Relation Concepts). The majority of Relation
Concepts did not match concepts in Meta-1. A vocabulary of Relation
Concepts would provide a useful starting point for a computer system
designed to aid physicians in answering these questions. Copyright 1992
Academic Press.</P>
<P>Forsythe DE, Buchanan BG, Osheroff JA, Miller RA. Expanding the concept
of medical information: an observational study of physicians' information
needs. Comput Biomed Res 1992 Apr;25(2):181-200. The authors describe an
empirical study of information needs in four clinical settings in internal
medicine in a university teaching hospital. In contrast to the
retrospective data often used in previous studies, this research used
ethnographic techniques to facilitate direct observation of communication
about information needs. On the basis of this experience, the authors
address two main issues: how to identify and interpret expressions of
information needs in medicine and how to broaden ones conception of
'information needs' to account for the empirical data. Copyright 1992
Academic Press.</P>
<P>Osheroff JA, Forsythe DE, Buchanan BG, Bankowitz RA, Blumenfeld BH,
Miller RA. Physicians' information needs: analysis of questions posed
during clinical teaching. Ann Intern Med 1991 Apr 1;114(7):576-81.
OBJECTIVE: To describe information requests expressed during clinical
teaching. SETTING: Residents' work rounds, attending rounds, morning
report, and interns' clinic in a university-based general medicine
service. SUBJECTS: Attending physicians, medical house staff, and medical
students in a general medicine training program. METHODS: An
anthropologist observed communication among study subjects and recorded in
field notes expressions of a need for information. We developed a coding
scheme for describing information requests and applied the coding scheme
to the data recorded. Based on assigned codes, we created a subset of
strictly clinical requests. MEASUREMENTS: Five hundred nineteen
information requests recorded during 17 hours of observed clinical
activity were selected for detailed analysis. These requests related to
the care of approximately 90 patients by 24 physicians and medical
students. Sixty-five requests were excluded because they were not strictly
clinical, leaving a subset of 454 clinical questions for analysis. MAIN
RESULTS: On average, five clinical questions were raised for each patient
discussed. Three hundred thirty-seven requests (74%) concerned patient
care. Of these 337 questions, 175 (52%) requested a fact that could have
been found in a medical record. Seventy-seven (23%) of these questions,
motivated by the needs of patient care, were potentially answerable by a
library, a textbook, a journal, or MEDLINE. Eighty-eight (26%) of the
questions asked for patient care required synthesis of patient information
and medical knowledge. CONCLUSIONS: Clinicians in the study settings
requested information frequently. Many of these information needs required
the synthesis of patient information and medical knowledge and thus were
potentially difficult to satisfy. A typology is proposed that
characterizes information needs as consciously recognized, unrecognized,
and currently satisfied. Copyright Annals of Internal Medicine; <A
"http://www.acponline.org/">http://www.acponline.org/</A>.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=4b>Vocabulary Analysis and Merging</A></STRONG>
</LI></UL>
<HR>
<P>Bicknell EJ, Sneiderman CA, Rada RF. Computer-assisted merging and
mapping of medical knowledge bases. Proc Annu Symp Comput Appl Med Care
1988:158-64. A user-interactive rule-based computer program, developed for
the purpose of mapping and merging multiple hierarchical thesauri, is
described. The program, called DynaSaurI (dynamic thesaurus integration),
was tested on subsets of two medical thesauri, the Systemized Nomenclature
of Medicine (SNOMED) and the Medical Subject Headings (MeSH). Each
thesaurus is treated as a knowledge base, containing information both in
the terms and in the various types of relationships between terms.
DynaSaurI uses combinations of string matching and tree browsing to
propose a ranked array of related MeSH terms for each SNOMED term
presented. A medical expert selected the closest match from the array of
terms proposed by DynaSaurI and entered the appropriate type of
relationship between the terms. The information acquired from the expert
was then used to refine DynaSaurI's mapping rules. With DynaSaurI, all 84
SNOMED concepts were successfully merged with and mapped to MeSH main
headings; 74(88%) were mapped by the initial DynaSaurI pass, and the
remainder by incorporating the user's responses. All merging utilized the
relationship descriptions (e.g., "is narrower than") provided by the
online interaction with the medical expert. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>From the president: reviewing nursing concepts to be included in the
1995 version of the Unified Medical Language System. Nurs Diagn 1995
Apr-Jun;6(2):53-4.</P>
<P>Kannry JL, Wright L, Shifman M, Silverstein S, Miller PL. Portability
issues for a structured clinical vocabulary: mapping from Yale to the
Columbia medical entities dictionary. J Am Med Inform Assoc 1996
Jan-Feb;3(1):66-78. To examine the issues involved in mapping an existing
structured controlled vocabulary, the Medical Entities Dictionary (MED)
developed at Columbia University, to an institutional vocabulary, the
laboratory and pharmacy vocabularies of the Yale New Haven Medical Center.
200 Yale pharmacy terms and 200 Yale laboratory terms were randomly
selected from database files containing all of the Yale laboratory and
pharmacy terms. These 400 terms were then mapped to the MED in three
phases: mapping terms, mapping relationships between terms, and mapping
attributes that modify terms. 73% of the Yale pharmacy terms mapped to MED
terms. 49% of the Yale laboratory terms mapped to MED terms. After certain
obsolete and otherwise inappropriate laboratory terms were eliminated, the
latter rate improved to 59%. 23% of the unmatched Yale laboratory terms
failed to match because of differences in granularity with MED terms. The
Yale and MED pharmacy terms share 12 of 30 distinct attributes. The Yale
and MED laboratory terms share 14 of 23 distinct attributes. The mapping
of an institutional vocabulary to a structured controlled vocabulary
requires that the mapping be performed at the level of terms,
relationships, and attributes. The mapping process revealed the importance
of standardization of local vocabulary subsets, standardization of
attribute representation, and term granularity. Copyright by and reprinted
with permission of the American Medical Informatics Association.</P>
<P>Lowe HJ, Barnett GO. Understanding and using the medical subject
headings (MeSH) vocabulary to perform literature searches. JAMA 1994 Apr
13;271(14):1103-8. Comment in: JAMA 1995 Jan 18;273(3):184; discussion
184-5.</P>
<P>Masarie FE Jr, Miller RA. Medical Subject Headings and medical
terminology: an analysis of terminology used in hospital charts. Bull Med
Libr Assoc 1987 Apr;75(2):89-94. Terminology used by health professionals
in everyday written discourse was compared with terminology in a
standardized medical vocabulary, the Medical Subject Headings (MeSH).
Fifty written hospital charts were selected at random and analyzed by a
computer program that identified MeSH terms in the charts. The charts were
analyzed against two related MeSH vocabularies- one containing MeSH terms
and one containing both MeSH terms and backwards cross-reference terms.
when small words such as articles and prepositions were disregarded,
approximately 50% of the words in a medical chart were found to be
MeSH-related terminology. In addition, about 40% of MeSH-related words in
the charts were either MeSH terms or backwards cross-reference terms.
Copyright by and reprinted with permission of the Medical Library
Association.</P>
<P>McCray AT, Browne AC, Moore DL. The semantic structure of neo-classical
compounds. Proc Annu Symp Comput Appl Med Care 1988:165-8. The automated
analysis of neo-classical compounds in the medical domain has been
proposed and carried out by a number of researchers in recent years. This
paper discusses the semantics of these compounds. The results indicate
that neo-classical compounds are semantically underdetermined by their
constituent parts. Thus, automated analysis of these compounds will need
to be supplemented by human review. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Miller PL, Smith P, Morrow JS, Riely CA, Powsner SM. Semantic
relationships and MeSH. Proc Annu Symp Comput Appl Med Care 1988:174-9.
This paper compares bibliographic retrieval using current MeSH (Medical
Subject Headings) to bibliographic retrieval using explicitly coded
semantic relationships between index terms. In a previous study, 10 lists
of abstracts, each list containing 20-40 papers discussing a specific pair
of terms, were analyzed to identify the specific relationship(s) between
those terms discussed in each paper. In the present study, we analyze how
well current MeSH coding, using topical subheadings and check tags, can
selectively retrieve those papers discussing each semantic relationship.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=4c>Knowledge Acquisition and
Representation</A></STRONG> </LI></UL>
<HR>
<P>Ball S, Wright L, Miller P. SENEX, an object-oriented biomedical
knowledge base. Proc Annu Symp Comput Appl Med Care 1989:85-9. An
object-oriented knowledge base, SENEX, in the domain of neurodegeneration
and loss of memory in aging is being developed. Initially, the focus is on
three sets of issues in the representation of biomedical information.
First, the authors are seeking to extend the medical subject headings
(MeSH) nomenclature to include new classes of biomedical entities and to
include relationships among those entities. Second, they are structuring
biomedical information rather than categorizing text for bibliographic
retrieval. Third, they are exploring ways in which such information could
be used in an interactive system created for purposes of education and for
designing basic research experiments. The current behavior of SENEX, which
is being developed using the Common Lisp Object System (CLOS), is
described. Various issues raised and plans for future development are
discussed. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Ball SS, Mah VH, Miller PL. SENEX: a computer-based representation of
cellular signal transduction processes in the central nervous system.
Comput Appl Biosci 1991 Apr;7(2):175-87. The SENEX project is exploring
knowledge representation in the neurobiology of ageing through
object-oriented programming. SENEX is built from a classification
structure of biologic entities and significant relationships among them.
For example, an enzyme is an entity and an enzymatic reaction is a
relationship among enzyme, cofactor(s), substrate(s) and product(s). There
are currently 2600 classes of entities and 50 classes of relationships in
SENEX. The class structure serves several functions. One function is to
interrelate general and specific categories of molecular and morphologic
entities. For example, tyrosine kinase and serine/threonine kinase are
specific types of the more general class of protein kinase enzymes.
Another function of the class structure is to serve as a network through
which inheritance of attributes may occur. For example, the attribute
'subunits' is inherited by all subclasses of the general class
multisubunit protein. Information may be accessed through links
established in the class structure and through links relating one object
as part of another. Relationships form the basis of separate modules
within SENEX. This paper describes the types of relationships currently
used and planned in the representation of age-related changes in cellular
signal transduction processes of mammalian central nervous systems. We
also describe tools for specific retrieval of relationships and for
tracing links in complex reaction cascades. Application of these tools to
identifying possible signal transduction pathways to guide further
exploration through experimentation is discussed. Reprinted by permission
of Oxford University Press.</P>
<P>Barr CE, Komorowski HJ, Pattison-Gordon E, Greenes RA. Conceptual
modeling for the unified medical language system. Proc Annu Symp Comput
Appl Med Care 1988:148-51. The Unified Medical Language System was
proposed by the National Library of Medicine to facilitate the exchange
and utilization of information from multiple sources. We are using
semantic networks as the knowledge representation scheme in a prototype
system to explore how to accomplish these goals. Conceptual modeling helps
define a complete and consistent set of objects and relationships to
include in the semantic net. Both top-down and bottom-up approaches were
found useful in the seven step process of building the semantic network.
Theoretical and practical issues are discussed as well as future
extensions to the current prototype. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Berman L, Cullen M, Miller PL. Automated integration of external
databases: a knowledge-based approach to enhancing rule-based expert
systems. Comput Biomed Res 1993 Jun;26(3):230-41. Expert system
applications in the biomedical domain have long been hampered by the
difficulty inherent in maintaining and extending large knowledge bases. We
have developed a knowledge-based method for automatically augmenting such
knowledge bases. The method consists of automatically integrating data
contained in commercially available, external, online databases with data
contained in an expert system's knowledge base. We have built a prototype
system, named DBX, using this technique to augment an expert system's
knowledge base as a decision support aid and as a bibliographic retrieval
tool. In this paper, we describe this prototype system in detail,
illustrate its use, and discuss the lessons we have learned in its
implementation. Copyright 1993 Academic Press.</P>
<P>Berman L, Cullen MR, Miller PL. Automated integration of external
databases: a knowledge-based approach to enhancing rule-based expert
systems. Proc Annu Symp Comput Appl Med Care 1992:227-33. Expert system
applications in the biomedical domain have long been hampered by the
difficulty inherent in maintaining and extending large knowledge bases. We
have developed a knowledge-based method for automatically augmenting such
knowledge bases. The method consists of automatically integrating data
contained in commercially available, external, on-line databases with data
contained in an expert system's knowledge base. We have built a prototype
system, named DBX, using this technique to augment an expert system's
knowledge base as a decision support aid and as a bibliographic retrieval
tool. In this paper, we describe this prototype system in detail,
illustrate its use and discuss the lessons we have learned in its
implementation. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Canfield K, Bray B, Huff S. Representation and database design for
clinical information. Proc Annu Symp Comput Appl Med Care 1990:350-3.
Semantic discourse analysis and sublanguage methods are used to create a
database model from free-text echocardiography reports. This model
dictates the object structure of a sematic model that is implemented in a
relations database form and evaluated for representational adequacy. The
sematic frame structure of this relational patient database is a flexible
projection of a hierarchical dictionary. The Unified Medical Language
System (UMLS) Metathesaurus could be used as such a dictionary. The result
is a structured clinical report database model that is built on a standard
dictionary and is generalizable to other domains. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Canfield KC, Bray BE, Huff SM, Warner HR. Database capture of natural
language echocardiographic reports: A UMLS approach. Proc Annu Symp Comput
Appl Med Care 1989:559-63. We describe a prototype system for
semiautomatic database capture of free-text echocardiography reports. The
system is very simple and uses a Unified Medical Language System
compatible architecture. We use this system and a large body of texts to
create a patient database and develop a comprehensive hierarchical
dictionary for echocardiography. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Chang S-Y. Kanes: knowledge acquisition for a neuroradiology expert
system [dissertation]. [Salt Lake City]: The University of Utah; 1991. 151
p. Available from: University Microforms, Ann Arbor, MI; 9133706. One of
the most severe obstacles to applying medical informatics to solve
practical medical problems is acquiring the knowledge base. The Iliad
knowledge base is among the most comprehensive medical knowledge bases in
existence. The amount of effort devoted to its creation and maintenance is
a testimony to the difficulty of building academic-quality, comprehensive
knowledge bases for practical medical applications. In addition to the
difficulty of knowledge acquisition, the accuracy and reliability of
knowledge base are also major concerns for the developers and users of
Iliad expert system. The major emphasis of this project was to use a
patient database to improve the efficiency of creating a knowledge base
for the neuroradiology domain and increase the accuracy of Iliad expert
system based on this knowledge base. The project introduced a knowledge
engineering model to automatically generate disease profiles in
neuroradiology. The model used a new technique to collect patient data,
obtain important statistics, calculate finding utility, and extract the
best findings for the diagnostic frames. Knowledge Acquisition for a
Neuroradiology Expert System (KANES) is an efficient, accurate, and
easy-to-use personal computer program that can assist knowledge engineers
in managing the patient database and executing the analysis tasks
described above. The experience with the KANES program using a relational
Database Management System (DBMS) can be extended to a larger environment
where information is gathered from multiple sources and where real-time
decisions need to be made. The knowledge engineering session in the
Department of Medical Informatics is a good example of such an environment
where different categories of individuals need and generate information
and make decisions related to teaching, research, management, and
administration. Under contract from the Unified Medical Language System
(UMLS) project of the National Library of Medicine, a database is being
built to contain clinical data from multiple sources like QMR, HELP, and
Iliad. As the quality of the data in medical information systems improves,
such databases will become an important resource for all of the
probabilities that drive computerized diagnostic systems. The KANES
program has the potential to expand to be a decision support system for
all medical domains that would help the groups in the knowledge
engineering session to make decisions more easily and more appropriately.
Provided by UMI.</P>
<P>Cimino JJ, Elkin PL, Barnett GO. As we may think: the concept space and
medical hypertext. Comput Biomed Res 1992 Jun;25(3):238-63. Hypertext, a
medium for presenting written material in a nonsequential manner, is
gaining popularity as a format for medical text. The structure of
traditional hypertext documents (hyperdocuments) includes author-created
links among text segments. This structure poses challenge for those who
create and maintain hyperdocuments, while reading them can introduce
disorientation and cognitive overload. An alternative model is presented
in which text segments are linked to the concepts which they contain and
the concepts are linked to each other in a semantic network called the
Concept Space. The concepts and semantic links attempt to approximate
potential topics of interest, allowing the reader to browse the
hyperdocument in an individualized manner, rather than in an
author-designated one. The concept space approach offers advantages for
both the author and the reader. Copyright 1992 Academic Press.</P>
<P>Cimino JJ, Mallon LJ, Barnett GO. Automated extraction of medical
knowledge from Medline citations. Proc Annu Symp Comput Appl Med Care
1988:180-4. The Medline database consists of over six million citations to
the medical literature, indexed by the National Library of Medicine with
the use of Medical Subject Headings (MeSH) and Subheadings. We propose
that analysis of MeSH Headings and Subheadings in Medline citations will
reveal the interrelationships among medical concepts described in the
original articles. We have developed a rule-based system which postulates
relationships based on the co-occurrence of MeSH Headings in Medline
citations. At present, the rule base consists of 504 rules which propose
57 relationships. When this rule base was applied to a test of 673
citations, 93% of the proposed relationships were determined to be correct
(96%, after correction of a transcription error in the rule base). We
believe this approach has great potential, both for assisting acquisition
of medical knowledge and for improving the quality of Medline retrievals.
Copyright by and reprinted with permission of the American Medical
Informatics Association.</P>
<P>Elkin PL, Cimino JJ, Lowe HJ, Aronow DB, Payne TH, Pincetl PS, Barnett
GO. Mapping to MeSH (the art of trapping MeSH equivalence from within
narrative text). Proc Annu Symp Comput Appl Med Care 1988:185-90. A tool
for identifying medical subject headings (MeSH) terms found in narrative
text is evaluated and discussed. The system's task is to discern unique
matches from within MeSH for noun phrases in narrative text. The program
consists of a medical morphological reduction routine, coupled with data
structures created for the MeSH vocabulary searcher, MicroMeSH. To
evaluate this tool, a study was undertaken within which three physicians
were asked to review citations from the Annals of Internal Medicine and
three paragraphs from a Textbook of Cardiology. They were asked to
identify all of the important medical concepts within both the citations
and text. Then these same physicians used MicroMeSH, to see which of these
medical concepts could be mapped to MeSH. These results were compared to
the output of our automated system. Of the concepts which were found to be
medical concepts by our panel of experts 89% were identified using
MicroMeSH as being represented in MeSH. The automated system was able to
translate 90% of those medical concepts to the same MeSH term as
identified by MicroMeSH. The remaining 10% of the concepts, which were
recognized by the experts and not by the system, were terms where the
medical knowledge of the experts allowed them to find matches which had no
representation, morphologically or through an Entry Term, in the MeSH
vocabulary. The specific algorithms, details of evaluation and potential
usefulness of the system are discussed. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Evans DA. Pragmatically-structured, lexical-semantic knowledge bases
for unified medical language systems. Proc Annu Symp Comput Appl Med Care
1988:169-73. Unified medical language systems must accommodate expressions
ranging from fixed-form standardized vocabularies to the free-text,
natural language of medical charts. Such ability will depend on the
identification, representation, and organization of the concepts that form
the useful core of the biomedical conceptual domain. The MedSORT-II and
UMLS Projects at Carnegie Mellon University have established a feasibile
design for the development of lexicons and knowledge bases to support the
automated processing of varieties of expressions (in the subdomain of
clinical findings) into uniform representations. The essential principle
involves incorporating lexical-semantic typing restrictions in a
pragmatically -structured knowledge base. The approach does not depend on
exhaustive knowledge representation, rather takes advantage of selective,
limited relations among concepts. In particular, the Projects have
demonstrated that practical, comprehensive, and accurate processing of
natural-language expressions is attainable with partial knowledge bases,
which can be rapidly prototyped. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Greenes RA, McClure RC, Pattison-Gordon E, Sato L. The
findings--diagnosis continuum: implications for image descriptions and
clinical databases. Proc Annu Symp Comput Appl Med Care 1992:383-7. As
part of the Unified Medical Language System (UMLS) project, we have been
exploring the use of semantic net representation to build a medical
ontology that can adapt to the needs and perspective of differing kinds of
users with varying purposes. A principal objective is to facilitate
indexing and retrieval of objects in a variety of target databases, using
their own source vocabularies, while maintaining the representation of
concepts to which these source vocabularies refer in a single consistent
form, so that retrievals that span resource types can be accommodated. In
addition, a particular area of deficiency of the existing UMLS
Metathesaurus is that of clinical findings, a part of the problem being
the multiple alternative views and granularity levels at which clinical
findings are described in different target databases. The problem is
particularly obvious when one examines the way in which image findings are
described, which may be at a purely perceptual level, or at varying levels
of aggregation into higher level observations or interpretations. We have
developed a recursive model for representing observations and
interpretations in a semantic net along a continuum of degree of
aggregation, that appears to lend itself well to adaptation to varying
perspectives. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Komorowski J, Barr CE, Pattison-Gordon E, Greenes RA. Knowledge
modeling for the Unified Medical Language System. In: Kangassalo H, Ohsuga
S, Jaakkola H, editors. Information modelling and knowledge bases.
Amsterdam: IOS; 1990. p. 313-17.</P>
<P>Masarie FE Jr, Miller RA, Bouhaddou O, Giuse NB, Warner HR. An
interlingua for electronic interchange of medical information: using
frames to map between clinical vocabularies. Comput Biomed Res 1991
Aug;24(4):379-400. The proliferation of medical knowledge has led to the
development of extensive dictionaries for electronically accessing
information resources. The task of standardizing terminology used for
electronic hospital records and for knowledge bases for medical expert
systems and indexing the medical literature cannot easily be met by
developing a single, monolithic official medical vocabulary. Developing a
monolithic vocabulary would require a massive effort, and its existence
would not guarantee its use by third-party payors, by practicing
clinicians, or by developers of electronic medical information systems.
Recognizing this, the National Library of Medicine (NLM) has begun to
develop the Unified Medical Language System (UMLS) as a means of promoting
electronic information exchange among systems with controlled
vocabularies. The authors describe a frame-based system developed as an
experimental approach to mapping between controlled clinical vocabularies.
Copyright 1991 Academic Press.</P>
<P>Miller PL, Barwick KW, Morrow JS, Powsner SM, Riely CA. Towards a
conceptual scema of medical knowledge: facilitating transition between
different computer-based forms of clinical information. In: Hammond WE.
Proceedings of the AAMSI Congress 88; 1988 May 5-7; San Francisco.
Washington (DC): American Association for Medical Systems and Informatics;
1988. p. 77-82.</P>
<P>Nelson SJ, Sheretz DD, Erlbaum MS, Tuttle MS. Representing medical
knowledge in the form of structured text. The development of current
disease descriptions. Proc Annu Symp Comput Appl Med Care 1989:66-70. As
part of the Unified Medical Language System (UMLS) initiative, about 900
diseases have been described using "structured text." Structured text is
words and short phrases entered under labelled contexts. Vocabulary is not
controlled. The contexts comprise a template for the disease description.
The structured text is both manipulable by machine and readable by humans.
Use of the template was natural, and only a few problems arose in using
the template. Instructions to disease description composers must be
explicit in definitions of the contexts. Diseases to be described are
chosen, after clustering related diseases, according to the distinctions
that physicians practicing in the area under question believe are
important. Limiting disease descriptions to primitive observations and to
entities otherwise described within the corpus appears to be both feasible
and desirable. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=4d>Information and Retrieval Techniques</A></STRONG>
</LI></UL>
<HR>
<P>Elkin PL, McLatchey J, Packer M, Hoffer E, Cimino C, Studney D, Barnett
GO. Automated batch searching of MEDLINE for DXplain. Proc Annu Symp
Comput Appl Med Care 1989:436-40. To obtain references for the diseases in
the DXplain database a generic search strategy was created and then
combined with a communication protocol for MEDLINE. The system's efficacy
has been tested on the concepts contained in the DXplain disease names.
The system takes the DXplain disease name and identifies MeSH Terms or
their equivalent from within this unstructured input. These terms are then
utilized to search MEDLINE. How the searches are constructed and the order
in which they are performed, depend upon a user defined script (protocol
for querying MEDLINE). These scripts can be run repetitively to cover
multiple concepts. This technique for searching MEDLINE was used to
download citations that will be used as references for diseases in the
DXplain Database. DXplain is a medical diagnostic aid program developed
and maintained at the MGH. The script used was a 28 step algorithm which
was designed to download the most recent review articles about each of the
DXplain diseases. The system provides the user with the ability to specify
the number of articles which he/she would like returned from MEDLINE. This
paper describes the technique by which the articles were retrieved, as
well as the review process and the success rate of the system in
identifying appropriate articles. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Miller PL, Barwick KW, Morrow JS, Powsner SM, Riely CA. Semantic
relationships and medical bibliographic retrieval: a preliminary
assessment. Comput Biomed Res 1988 Feb;21(1):64-77. This paper describes a
project exploring whether semantic relationships between bibliographic
terms may effectively partition the clinical literature. To address this
question, a set of semantic relationships was identified between pairs of
bibliographic terms taken from four categories: (1) diseases, (2)
treatments, (3) tests, and (4) patient characteristics. The MEDLINE system
of the National Library of Medicine was used to generate lists of
abstracts relating to pairs of clinical terms. Each list of abstracts was
examined to identify the semantic relationships, if any, which applied to
the two terms in each paper. The study suggests that semantic
relationships may play a potentially valuable role in assisting
computer-based medical bibliographic retrieval. The degree to which
relationships partition the literature is strongly dependent on the
underlying semantics of the particular bibliographic terms involved.
Copyright 1988 Academic Press.</P>
<P>Miller PL, Morrow JS, Powsner SM, Riely CA. Semantically assisted
medical bibliographic retrieval: an experimental computer system. Bull Med
Libr Assoc 1988 Apr;76(2):131-6. An experimental computer-based
bibliographic retrieval system has been implemented to explore how
semantic (conceptual) relationships between MeSH terms might assist the
retrieval process. To construct the experimental system's database, lists
of abstracts were produced using MEDLINE. Each list contained papers
discussing a specified pair of terms. Each abstract was then analyzed to
determine the specific relationship(s) between the two terms discussed in
that paper. The project then explored how these semantic relationships
could be incorporated into the computer to enhance bibliographic
retrieval. Copyright by and reprinted with permission of the Medical
Library Association.</P>
<P>Miller PL, Smith P, Morrow JS, Riely CA, Powsner SM. Capturing the
semantic relationship between clinical terms with current MeSH
bibliographic coding. Comput Methods Programs Biomed 1988
Nov-Dec;27(3):205-11. This paper compares bibliographic retrieval using
current MeSH (Medical Subject Headings) to bibliographic retrieval using
explicitly coded semantic relationships between index terms. In a previous
study, ten lists of abstracts, each list containing 20-40 papers
discussing a specific pair of terms, were analyzed to identify the
specific relationship(s) between those terms discussed in each paper. In
the present study, we analyze how well current MeSH coding using topical
subheadings and check tags, can selectively retrieve those papers
discussing each semantic relationship.</P>
<P>Powsner SM, Barwick KW, Morrow JS, Riely CA, Miller PL. Coding semantic
relationships for medical bibliographic retrieval: a preliminary study.
Proc Annu Symp Comput Appl Med Care 1987:108-12. It is suggested that the
coding of semantic relationships may permit more precise searches of the
medical literature than conventional key/index term coding with Boolean
operators for retrieval. Such semantic coding captures the distinction
between papers concerned with how hepatitis B (HB) may cause/predispose to
liver neoplasms (LN) and papers concerned with how HB may effect outcome
in patients with LN. These distributions were demonstrated by retrieving
sets of MEDLINE abstracts, each set relevant to two clinical terms. Each
abstract was then reviewed to determine the implied semantic
relationship(s) between the two terms. Even in the restricted realm of
liver diseases a number of very different relationships between terms are
addressed in the literature. In addition, coding 'no relationship' allows
articles discussing LN and HB independently to be avoided. It is concluded
that semantic-relationship coding may prove to be very helpful for
retrieving concise reference lists, to support clinical decisions.
Copyright 1987 IEEE. Reprinted, with permission.</P>
<P>Radow DP, Blake M, Howard E, Jones C, Milgrom L, Ostergard M, Shaffer
E. Using the Metathesaurus for bibliographic retrieval: a
pre-implementation study. Proc Annu Symp Comput Appl Med Care
1994:980.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=4e>Vocabulary Browsers</A></STRONG> </LI></UL>
<HR>
<P>Appel RD, Komorowski HJ, Barr CE, Greenes RA. Intelligent focusing in
knowledge indexing and retrieval - the relatedness tool. Proc Annu Symp
Comput Appl Med Care 1988:152-7. Most present day information retrieval
systems use the presence or absence of certain words to decide which
documents are appropriate for a user's query. This approach has had
certain successes, but it fails to capture relationships between concepts
represented by the words, and hence reduces the potential specificity of
both indexing and searching of documents. A richer representation of the
semantics of documents and queries, and methods for reasoning about these
representations, have been provided by artificial intelligence.
Navigational tools for browsing and authoring knowledge bases (KB's) add a
convenient technique for focusing in the complex landscape of semantic
representations. The center of such representations is usually a frame or
a semantic network system. We are developing a prototype Unified Medical
Language System (UMLS) taxonomy to represent objects and relationships in
medicine. One focus of our research is improved methods for indexing and
querying repositories of biomedical literature. The technique which we
propose is based on the notion of relatedness of concepts. To this end we
define heuristics which find related concepts and apply it to the UMLS
taxonomy. Preliminary results from experiments with the implemented
heuristics demonstrate its potential usefulness. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Komorowski HJ, Greenes RA, Barr C, Pattison-Gordon E. Browsing and
authoring tools for a Unified Medical Language System. In: User-oriented
content-based text and image handling. RIAO 88 Program. Conference with
Presentation of Prototypes and Operational Demonstrations; 1988 Mar 21-24;
Cambridge, MA. Paris: C.I.D.; 1988. p. 624-41.</P>
<P>Komorowski HJ, Greenes RA, Pattison-Gordon E. The use of fisheye views
for displaying semantic relationships in a medical taxonomy. Proc Annu
Symp Comput Appl Med Care 1987:113-6. One of the critical issues for
development of the unified medical language system (UMLS), or taxonomy of
medical terms, is the identification of semantic features and
relationships that should be represented in the UMLS and the design of the
appropriate structure for storing and displaying these features and
relationships. One approach, the use of the 'fisheye view' for displaying
a region of interest in a semantic network, is discussed. This approach
narrows the field of view at any given time to include only the most
important and immediate 'landmarks', or items. Any of the se could then be
focused on, or another level of detail accessed. Copyright 1987 IEEE.
Reprinted, with permission.</P>
<P>Lowe H, Barnett GO, Scott J, Mallon L, Ryan-Blewett D. Remote Access
MicroMeSH: demonstration of an enhanced microcomputer system for searching
the MEDLINE database. Proc Annu Symp Comput Appl Med Care 1989:1009-11.
Remote Access MicroMeSH (RAMM) is a powerful but easy to use microcomputer
system for searching the medical literature. RAMM uses MicroMeSH, a system
for accessing the National Library of Medicine's (NLMs) Medical Subject
Headings (MeSH) vocabulary, to facilitate offline creation and refinement
of highly specific MEDLINE search queries. Using these queries, RAMM
automatically searches and retrieves citations from the MEDLINE databases
through the NLMs MEDical Literature Analysis and Retrieval System
(MEDLARS). As search query creation and citation review are performed
offline, the cost of online searching is minimized. Copyright by and
reprinted with permission of the American Medical Informatics
Association.</P>
<P>Lowe HJ, Barnett GO. MicroMeSH: a microcomputer system for searching
and exploring the National Library of Medicine's Medical Subject Headings
(MeSH) vocabulary. Proc Annu Symp Comput Appl Med Care 1987:717-20.
MicroMeSH is a microcomputer-based tool for searching and exploring a
complete, keyworded version of the National Library of Medicine's Medical
Subject Headings (MeSH) vocabulary. MeSH is used to index the MEDLINE
database. MicroMeSH allows the user to retrieve MeSH headings rapidly,
using either a powerful search operation or a user-friendly MeSH Tree
Walker. MicroMeSH can translate many commonly used biomedical terms to
equivalent MeSH headings. The program also provides access to the MeSH
subheadings vocabulary. The authors describe the operation of MicroMeSH
and the computer hardware required to use the system. Copyright 1987 IEEE.
Reprinted, with permission.</P>
<P>Lowe HJ, Barnett GO, Scott J, Mallon L, Blewett DR. Remote Access
MicroMeSH: evaluation of a microcomputer system for searching the MEDLINE
database. Proc Annu Symp Comput Appl Med Care 1989:445-7. Remote Access
MicroMeSH (RAMM) is a powerful but easy-to-use microcomputer system for
searching the MEDLINE database. RAMM incorporates MicroMeSH, a
microcomputer implementation of the National Library of Medicine's (NLMs)
Medical Subject Headings (MeSH) vocabulary. RAMM facilitates the creation
of highly specific MEDLINE search queries. The goals in creating RAMM were
to provide a system that could be used to search the medical literature
and to teach the basic skills required to use MeSH and MEDLINE. During the
past two years RAMM has been used by clinicians, library professionals,
researchers, and students at Harvard Medical School and at selected
academic sites in the US and Canada. In February of 1989, an effort to
formally evaluate RAMM was begun. This paper describes the preliminary
results of that evaluation. Copyright by and reprinted with permission of
the American Medical Informatics Association.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<UL>
<LI><STRONG><A name=4f>Research Tools</A></STRONG> </LI></UL>
<HR>
<P>Fu LS. A public domain unified medical language system (UMLS) patient
database (hospital information systems, event definition structures)
[dissertation]. [Salt Lake City]: The University of Utah; 1992. 132 p.
Available from: University Microforms, Ann Arbor, MI; 9236271. This
document has presented a research work under the Unified Medical Language
System (UMLS) design and its conceptual framework as well as its
experimental implementation has been introduced. Three hypotheses have
been proposed and tested with real patient cases from two hospital
information systems (HELP and VA). Primary conclusions of this work were:
(1) The total number of MOI entries will not grow indefinitely. For a
given domain, it tends to level-off as more data sources are added. (2) To
date, Event Definition structures can correctly represent a selected
subset of dictionary entries ranging from 83% to 99%. (3) The current
automatic instantiation algorithm has proven to have an 87% success rate.
(4) From the evidence shown using this prototype with the UMLS patient
database, it is possible to combine electronic patient records from
different patient information systems into a unified structure. Moreover,
this prototype allows the user to visually inspect the distribution of
relevant medical variables which demonstrates discrimination between
disease and nondisease groups independent of the source of data. Also,
several vital future enhancements were also discussed. Provided by
UMI.</P>
<P>Fu LS, Bouhaddou O, Huff SM, Sorenson DK, Warner HR. Toward a public
domain UMLS patient database. Proc Annu Symp Comput Appl Med Care
1990:170-4. The paper describes a unified structure with an associated
vocabulary to represent and store patient cases derived from different
computerized patient databases. The unified structure is based on the
concept of event definitions which are generic templates for representing
clinical data in a patient database. An implementation of this structure
has been evaluated using patient cases from two expert system (Iliad and
QMR) and a hospital information system (HELP). The primary focus of the
UMLS patient database is to accumulate patient information from different
sources and provide enhanced statistical estimates of clinically important
variables. Inter-communication and navigation among medical information
systems are other potential benefits of this unified computerized medical
record system. Copyright by and reprinted with permission of the American
Medical Informatics Association.</P>
<P>Fu LS, Huff S, Bouhaddou O, Bray B, Warner H. Estimating frequency of
disease findings from combined hospital databases: a UMLS project. Proc
Annu Symp Comput Appl Med Care 1991:373-7. Merging data from the Salt Lake
VA hospital database and the LDS hospital HELP system into a UMLS
sponsored unified patient database has demonstrated that distribution of
variables within a disease is hospital independent. Although disease
prevalence is clearly not the same among hospitals, analysis of data
within a disease group across hospitals can be done using such a merged
database. This unified patient database would allow study of unusual
diseases not possible using data from a single institution. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Schuyler PL, McCray AT, Schoolman HM. A test collection for
experimentation in bibliographic retrieval. Medinfo 1989;6(Pt 2):910-12.
To establish an environment in which various search and retrieval
experiments can be performed, a subset of MEDLINE, the National Library of
Medicine's bibliographic database, has been created according to the
following requirements: all citations have a 1986 journal publication
year, are in English, and have an author-prepared abstract. The resulting
file contain approximately 167000 citations. This is a reasonable size
that satisfies several necessary conditions for conducting search and
retrieval experiments. Accompanying this file are approximately one
hundred and fifty questions asked by users of the MEDLINE database and
approximately three thousand citations retrieved from the experimental
file in response to these queries. Assessments of the relevance of the
retrieved citations to the questions asked are also available.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H2><A name=5>The UMLS in Relation to Other Programs</A></H2>
<HR>
<P>Cimino JJ. Review paper: coding systems in health care . Methods Inf
Med 1996 Dec;35(4-5):273-84. Computer-based patient data which are
represented in a coded form have a variety of uses, including direct
patient care, statistical reporting, automated decision support, and
clinical research. No standard exists which supports all of these
functions. Abstracting coding systems, such as ICD, CPT, DRGs and MeSH
fail to provide adequate detail, forcing application developers to create
their own coding schemes for systems. Some of these schemes have been put
forward as possible standards, but they have not been widely accepted.
This paper reviews existing schemes used for abstracting, electronic
record systems, and comprehensive coding. It also discusses the remaining
impediments to acceptance of standards and the current efforts to overcome
them, including SNOMED, the Gabrieli Medical Nomenclature, the Read
Clinical Codes, GALEN, and the Unified Medical Language System (UMLS).</P>
<P>Cimino JJ, Sengupta S. IAIMS and UMLS at Columbia-Presbyterian Medical
Center. Med Decis Making 1991 Oct-Dec;11(4 Suppl):89S-93S. The authors use
an example to illustrate combining Integrated Academic Information
Management System (IAIMS) components (applications) into an integral
whole, to facilitate using the components simultaneously or in sequence.
They examine a model for classifying IAIMS systems, proposing ways in
which the Unified Medical Language System (UMLS) can be exploited by them.
Copyright 1991 Hanley and Belfus.</P>
<P>Frawley SJ. Building a Database of Data Sets for Health Services
Research. Proc Annu Symp Comput Appl Med Care 1994:377-81. The Database of
Data Sets (DB/DS) for Health Services Research will be an online
searchable directory of data sets which are available, often with
restrictions and confidentiality safeguards, for use by health care
researchers. The DB/DS project is aimed at a wide audience, and intends to
include a very broad range of health care data sets, ranging from state
hospital discharge data bases, to national registries and health survey
data sets, to institutional clinical databases. The intended users are the
same community of researchers, policy-makers, administrators and
practitioners who are served by the National Library of Medicine's current
bibliographic databases. This paper describes a pilot phase of the DB/DS
project in which the issues involved in creating such a database were
explored with an initial set of 20 representative data sets. Copyright by
and reprinted with permission of the American Medical Informatics
Association.</P>
<P>Henry SB, Holzemer WL, Reilly CA, Campbell KE. Terms used by nurses to
describe patient problems: can SNOMED III represent nursing concepts in
the patient record? J Am Med Inform Assoc 1994 Jan-Feb;1(1):61-74.
OBJECTIVE: To analyze the terms used by nurses in a variety of data
sources and to test the feasibility of using SNOMED III to represent
nursing terms. DESIGN: Prospective research design with manual matching of
terms to the SNOMED III vocabulary. MEASUREMENTS: The terms used by nurses
to describe patient problems during 485 episodes of care for 201 patients
hospitalized for Pneumocystis carinii pneumonia were identified. Problems
from four data sources (nurse interview, intershift report, nursing care
plan, and nurse progress note/flowsheet) were classified based on the
substantive area of the problem and on the terminology used to describe
the problem. A test subset of the 25 most frequently used terms from the
two written data sources (nursing care plan and nurse progress
note/flowsheet) were manually matched to SNOMED III terms to test the
feasibility of using that existing vocabulary to represent nursing terms.
RESULTS: Nurses most frequently described patient problems as
signs/symptoms in the verbal nurse interview and intershift report. In the
written data sources, problems were recorded as North American Nursing
Diagnosis Association (NANDA) terms and signs/symptoms with similar
frequencies. Of the nursing terms in the test subset, 69% were represented
using one or more SNOMED III terms. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Integrated Academic Information Management Systems (IAIMS). Bull Med
Libr Assoc 1992 Jul;80(3):241-3. This paper reviews the proceedings of the
symposia sponsored by the Integrated Academic Information Management
Systems Association. IAIMS is described from the perspectives of
information management, knowledge management, and information technology.
Papers delivered at the symposia are reviewed. An overview of the National
Library of Medicine and the IAIMS initiative at NLM, the use of an IAIMS
project at Georgetown University to bring together multiple sources of
information, and the linking of an IAIMS system to the Unified Medical
Language System initiative at Yale are also discussed. Copyright by and
reprinted with permission of the Medical Library Association.</P>
<P>Lindberg DA. Global information infrastructure. Int J Biomed Comput
1994 Jan;34(1-4):13-9. The High Performance Computing and Communications
Program (HPCC) is a multiagency federal initiative under the leadership of
the White House Office of Science and Technology Policy, established by
the High Performance Computing Act of 1991. It has been assigned a
critical role in supporting the international collaboration essential to
science and to health care. Goals of the HPCC are to extend USA leadership
in high performance computing and networking technologies; to improve
technology transfer for economic competitiveness, education, and national
security; and to provide a key part of the foundation for the National
Information Infrastructure. The first component of the National Institutes
of Health to participate in the HPCC, the National Library of Medicine
(NLM), recently issued a solicitation for proposals to address a range of
issues, from privacy to 'testbed' networks, 'virtual reality,' and more.
These efforts will build upon the NLM's extensive outreach program and
other initiatives, including the Unified Medical Language System (UMLS),
MEDLARS, and Grateful Med. New Internet search tools are emerging, such as
Gopher and 'Knowbots'. Medicine will succeed in developing future
intelligent agents to assist in utilizing computer networks. Our ability
to serve patients is so often restricted by lack of information and
knowledge at the time and place of medical decision-making. The new
technologies, properly employed, will also greatly enhance our ability to
serve the patient.</P>
<P>Lindberg DA. The IAIMS opportunity: the NLM view. Bull Med Libr Assoc
1988 Jul;76(3):224-5.</P>
<P>McCormick KA, Zielstorff R. Building a Unified Nursing Language System
(UNLS). In. Nursing data systems: the emergency framework. Washington
(DC): American Nurses Publishing; 1995. p.143-9.</P>
<P>Paton JA, Belanger A, Cheung KH, Grajek S, Branch KA, Ikeda N, Sette L,
Miller PL, Fryer RK. Online bibliographic information: integration into an
emerging IAIMS environment. Proc Annu Symp Comput Appl Med Care
1992:605-9. The Medical Library at Yale University has developed an online
free-text database containing Current Contents citations. The database was
designed to be integrated into an emerging campus-wide information
environment. To this end Current Contents at Yale was designed with a user
interface familiar to the Yale community, an alerting service based on
electronic mail, and search expansion using the National Library of
Medicine's Meta-1 metathesaurus. Copyright by and reprinted with
permission of the American Medical Informatics Association.</P>
<P>Paton JA, Clyman JI, Lynch P, Miller PL, Sittig DF, Berson BZ.
Strategic planning for IAIMS: prototyping as a catalyst for change. Proc
Annu Symp Comput Appl Med Care 1990:709-13. Yale School of Medicine has
developed a prototype integrated computing and information environment as
part of its strategic IAIMS planning. The prototype consists of a menu
system and underlying network communications programs and networks to
access a variety of medical information resources at Yale and elsewhere.
This prototype has been used in testing user needs, in designing a
technical architecture, in exploring related institutional issues, and as
a basis for research in integrated access to medical information using
UMLS tools and concepts. Copyright by and reprinted with permission of the
American Medical Informatics Association.</P>
<P>Roderer NK. Dissemination of medical information: organizational and
technological issues in health sciences libraries. Libr Trends 1993
Summer;42(1):108-26. This article describes five programs that have been
particularly significant to the evolution of biomedical communications
over the last twenty years: the National Network of Libraries of Medicine
(NNLM), Integrated Academic Information Management Systems (IAIMS),
National Research and Education Network (NREN), Unified Medical Language
System (UMLS), and the electronic journal. The major implications that
each of these programs will continue to have for health sciences
librarianship are examined. Reprinted with permission from Library Trends.
Copyright 1993 The Board of Trustees of the University of Illinois.</P>
<P>Scherrer JR. Medical languages: use, definition and processing in ward
information systems (WIS). In: Adlassnig KP, Grabner G, Bengtsson S,
Hansen R, editors. Medical informatics Europe 1991. Proceedings; 1991 Aug
19-22; Vienna, Austria. Berlin: Springer-Verlag; 1991. p. 19-27.</P>
<P>Scherrer JR. [New architectures destined for hospital computer networks
opening the medical world to more communication facilities of every kind].
Schweiz Med Wochenschr 1990 Dec 8;120(49):1866-71. (Fre). </P>
<P>Siegel ER. High priority research at NLM. In: Information: the
transformation of society. Proceedings of the 50th Annual Meeting of the
American Society for Information Science; 1987 Oct 4-8; Boston, MA.
Medford (NJ): Learned Information; 1987. p. 275-6. A growing body of
medically related machine-readable data of at least four types is
identified. These include: biomedical literature, clinical records,
medically relevant data banks, and knowledge bases. The development of a
unified medical language system (UMLS) is discussed. The use of artificial
intelligence techniques in diagnosis and management is explored.
Reproduced with permission of the American Society for Information
Science.</P>
<P>Smith KA. Medical information systems (National Library of Medicine
information services). Bull Am Soc Inf Sci 1986 Apr-May;12(4):17-8. This
description of information services from the National Library of Medicine
(NLM) highlights a new system for retrieving information from NLM's
databases (GRATEFUL MED); a formal Regional Medical Library Network;
DOCLINE; the Unified Medical Language System; and Integrated Academic
Information Management Systems. Research and development and the future
are discussed . Reproduced with permission of the American Society for
information Science.</P>
<P>Tilley CB. Medical databases and health information systems. Annu Rev
Inf Sci Tech 1990;25:313-82.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<HR>
<H2><A name=6>Commentaries and Opinions about UMLS</A></H2>
<HR>
<P>Bishop CW. Alternate approaches to a UMLS. Med Decis Making 1991
Oct-Dec;11(4 Suppl):S99-102. A scheme for the continuing development of
Meta-1, a taxonomy of medical subjects based; on MeSH and other systems,
is described. The objective is a single, structured classification for
medical knowledge. Copyright 1991 Hanley and Belfus.</P>
<P>Bishop CW, Ewing P. Representing medical knowledge: reconciling the
present or creating the future? MD Comput 1992 Jul-Aug;9(4):218-25. Modern
technology has sparked the creation of computing systems that perform many
medically related tasks, but communication between these systems is
limited, in part by differences in the terminology used for various
purposes and in part by the changing nature of medical concepts. The
Unified Medical Language System represents an attempt to find a means of
translation between diverse knowledge systems. An alternative, which we
propose, is to agree on a knowledge base for the future and make use of
present accomplishments in moving toward that goal. Copyright 1992
Springer-Verlag.</P>
<P>Cimino JJ. Saying what you mean and meaning what you say: coupling
biomedical terminology and knowledge. Acad Med 1993 Apr;68(4):257-60.</P>
<P>Evans DA. Medical language processing: issues and methods in unifying
medical concepts: reflections on the UMLS project. In: Managing
information and technology. Proceedings of the 52nd Annual Meeting of the
American Society for Information Science; 1989 Oct 30-Nov 2; Washington,
DC. Medford (NJ): Learned Information; 1989. p. 252-3. Several
medical-related language processing projects are examined: (1) the UMLS
project, focusing on development of a "meta-thesaurus" for concepts in
biomedicine and an "information sources map" to coordinate access to
information across databases; (2) NYU's Medical Language Processor (MLP),
a 5-stage computer processing system which analyzes sentences so that
their informational elements are recognized and labeled for mapping into
the correct database field; and (3) the Systemized Nomenclature of
Medicine (SNOMED), which is a comprehensive indexing system for clinical
medicine. Reproduced with permission of the American Society for
Information Science.</P>
<P>Rudin JL. DART (Diagnostic Aid and Resource Tool): a computerized
clinical decision support system for oral pathology. Compendium 1994
Nov;15(11):1316, 1318, 1320 passim.</P>
<P>Tuttle MS, Nelson SJ. The role of the UMLS in 'storing' and 'sharing'
across systems. Int J Biomed Comput 1994 Jan;34(1-4):207-37. We will argue
that 'sharing', 're-use', 're-purposing', and 'addition' of health care
information is difficult, intrinsically; that the best way to overcome the
difficulty is to start doing it, as soon as possible, and that the UMLS
Knowledge Sources provide the best place to start. We recommend that the
UMLS be used as a default source of biomedical concept names and
relationships, as a comprehensive, data-based, 'reference model', and as
an example of a large, ecumenical, evolving, continuously updated source
of re-usable health care information.</P><A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#list">Return to title
page</A> | <A
href="http://www.nlm.nih.gov/archive/20040831/pubs/cbm/umlscbm.html#15">Return to table of
contents</A>
<P><!-- ************************* Content end ************************* -->
<br/>
<b>First published: </b>21 March 1997<br/><b>Last updated: </b>24 April 1998<br/><b>Date Archived: </b>31 August 2004<br/><a href="http://www.nlm.nih.gov/cgi/viewMeta.pl?url=http://www.nlm.nih.gov/archive//20040831/pubs/cbm/umlscbm.html&amp;description=full" onclick="javascript:openPopup('http://www.nlm.nih.gov/cgi/viewMeta.pl?url=http://www.nlm.nih.gov/archive//20040831/pubs/cbm/umlscbm.html&amp;description=full'); return false;"><strong>Metadata</strong></a> | <b> <a href="http://www.nlm.nih.gov/permlevels.html"onclick="javascript:openPopup('http://www.nlm.nih.gov/permlevels.html'); return false;">Permanence level</a>: </b>Permanent: Stable Content<br/>
<p> </p>
<!-- BEGIN NLM FOOTER --></P></TD></TR>
<TR>
<TD vAlign=top noWrap>
<CENTER>
<HR width=550>
<FONT face="helvetica, arial" size=2><A
"http://www.nlm.nih.gov/nlmhome.html">U.S. National Library of
Medicine</A>, 8600 Rockville Pike, Bethesda, MD 20894 <BR><A
"http://www.nih.gov/">National Institutes of Health</A>, <A
"http://www.os.dhhs.gov/">Department of Health &amp; Human
Services</A> <BR><A
"http://www.nlm.nih.gov/copyright.html">Copyright</A>, <A
"http://www.nlm.nih.gov/privacy.html">Privacy</A>, <A
"http://www.nlm.nih.gov/accessibility.html">Accessibility</A>
<BR>Last updated: 24 April 1998 <!-- EXPDATE="2003-04-30" --><!-- EMAIL="refweb@nlm.nih.gov" --></FONT></CENTER></TD></TR></TBODY></TABLE><!-- END NLM FOOTER -->
<p> </p>
<table width="100%" border="0" cellpadding="0" cellspacing="0" id="archeader">
<tr id="breadcrumb" >
<td colspan="5"><span id="arccontainerfooter">Home &gt; <strong>NLM Archives</strong> &gt; </span> <span id="disclaimerfooter"><strong>Document content is not current. Links may be broken.</strong></span><span class="spacer"></span></td>
</tr>
</table>
<div id="footer">
<br/>
<span id="subLeft"><a href="http://www.nlm.nih.gov/copyright.html">Copyright</a>, <a href="http://www.nlm.nih.gov/privacy.html">Privacy</a>, <a href="http://www.nlm.nih.gov/accessibility.html">Accessibility</a><br />
<a href="http://www.nlm.nih.gov">U.S. National Library of Medicine</a>, 8600 Rockville Pike, Bethesda, MD 20894<br />
<a href="http://www.nih.gov/">National Institutes of Health</a>, <a href="http://www.os.dhhs.gov/">Health &amp; Human
Services</a></span></div>
</body>
</html>