<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v15i7e144</article-id>
            <article-id pub-id-type="pmid">23903235</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.2569</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>User Evaluation of the Effects of a Text Simplification Algorithm Using Term Familiarity on Perception, Understanding, Learning, and Information Retention</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Ferreira</surname>
                        <given-names>Liliana</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Toldo</surname>
                        <given-names>Luca</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Leroy</surname>
                        <given-names>Gondy</given-names>
                    </name>
                    <degrees>MS, PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>Information Systems and Technology</institution>
                        <institution>Claremont Graduate University</institution>
                        <addr-line>ACB 225</addr-line>
                        <addr-line>130 E Ninth Street</addr-line>
                        <addr-line>Claremont, CA, 91711</addr-line>
                        <country>United States</country>
                        <phone>1 909 607 3270</phone>
                        <fax>1 909 621 8564</fax>
                        <email>gondy.leroy@cgu.edu</email>
                    </address>
                    <xref ref-type="aff" rid="aff2">2</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Endicott</surname>
                        <given-names>James E</given-names>
                    </name>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib3" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Kauchak</surname>
                        <given-names>David</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff3">3</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib4" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Mouradi</surname>
                        <given-names>Obay</given-names>
                    </name>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib5" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Just</surname>
                        <given-names>Melissa</given-names>
                    </name>
                    <xref ref-type="aff" rid="aff4">4</xref>
                </contrib>
            </contrib-group>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <institution>Information Systems and Technology</institution>
                <institution>Claremont Graduate University</institution>
                <addr-line>Claremont, CA</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2" rid="aff2">
                <sup>2</sup>
                <institution>Eller College of Management</institution>
                <institution>Department of Management Information Systems</institution>
                <institution>University of Arizona</institution>
                <addr-line>Tucson, AZ</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff3" rid="aff3">
                <sup>3</sup>
                <institution>Computer Science Department</institution>
                <institution>Middlebury College</institution>
                <addr-line>Middlebury, VT</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff4" rid="aff4">
                <sup>4</sup>
                <institution>Rutgers University Libraries</institution>
                <institution>Rutgers, The State University of New Jersey</institution>
                <addr-line>New Brunswick, NJ</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Gondy Leroy <email>gondy.leroy@cgu.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>07</month>
                <year>2013</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>31</day>
                <month>07</month>
                <year>2013</year>
            </pub-date>
            <volume>15</volume>
            <issue>7</issue>
            <elocation-id>e144</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>06</day>
                    <month>02</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-request">
                    <day>12</day>
                    <month>05</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-recd">
                    <day>31</day>
                    <month>05</month>
                    <year>2013</year>
                </date>
                <date date-type="accepted">
                    <day>09</day>
                    <month>06</month>
                    <year>2013</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Gondy Leroy, James E Endicott, David Kauchak, Obay Mouradi, Melissa Just. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 31.07.2013. </copyright-statement>
            <copyright-year>2013</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2013/7/e144/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Adequate health literacy is important for people to maintain good health and manage diseases and injuries. Educational text, either retrieved from the Internet or provided by a doctor&#8217;s office, is a popular method to communicate health-related information. Unfortunately, it is difficult to write text that is easy to understand, and existing approaches, mostly the application of readability formulas, have not convincingly been shown to reduce the difficulty of text.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>To develop an evidence-based writer support tool to improve perceived and actual text difficulty. To this end, we are developing and testing algorithms that automatically identify difficult sections in text and provide appropriate, easier alternatives; algorithms that effectively reduce text difficulty will be included in the support tool. This work describes the user evaluation with an independent writer of an automated simplification algorithm using term familiarity.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>Term familiarity indicates how easy words are for readers and is estimated using term frequencies in the Google Web Corpus. Unfamiliar words are algorithmically identified and tagged for potential replacement. Easier alternatives consisting of synonyms, hypernyms, definitions, and semantic types are extracted from WordNet, the Unified Medical Language System (UMLS), and Wiktionary and ranked for a writer to choose from to simplify the text. We conducted a controlled user study with a representative writer who used our simplification algorithm to simplify texts. We tested the impact with representative consumers. The key independent variable of our study is lexical simplification, and we measured its effect on both perceived and actual text difficulty. Participants were recruited from Amazon&#8217;s Mechanical Turk website. Perceived difficulty was measured with 1 metric, a 5-point Likert scale. Actual difficulty was measured with 3 metrics: 5 multiple-choice questions alongside each text to measure understanding, 7 multiple-choice questions without the text for learning, and 2 free recall questions for information retention.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>Ninety-nine participants completed the study. We found strong beneficial effects on both perceived and actual difficulty. After simplification, the text was perceived as simpler (<italic>P</italic>&#60;.001) with simplified text scoring 2.3 and original text 3.2 on the 5-point Likert scale (score 1: easiest). It also led to better understanding of the text (<italic>P</italic>&#60;.001) with 11% more correct answers with simplified text (63% correct) compared to the original (52% correct). There was more learning with 18% more correct answers after reading simplified text compared to 9% more correct answers after reading the original text (<italic>P</italic>=.003). There was no significant effect on free recall.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>Term familiarity is a valuable feature in simplifying text. Although the topic of the text influences the effect size, the results were convincing and consistent.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>text simplification</kwd>
                <kwd>health literacy</kwd>
                <kwd>consumer health information</kwd>
                <kwd>natural language processing</kwd>
                <kwd>evaluation study</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <sec>
                <title>Background and Significance</title>
                <p>Text is an important source for health-related information. It is easy to create, maintain, and distribute, and medical practitioners often use it to provide instructions and details on treatments. Health-related text is becoming increasingly available with an estimated 80% of online users [<xref ref-type="bibr" rid="ref1">1</xref>] from a wide array of backgrounds [<xref ref-type="bibr" rid="ref2">2</xref>] using the Internet to obtain health-related information. The information itself is diverse and includes prevention, treatment, and management of diseases and comes from a variety of sources ranging from professionals to salespeople to patients.</p>
                <p>Unfortunately, 90 million Americans have difficulty understanding and acting upon health information [<xref ref-type="bibr" rid="ref3">3</xref>], and many find the text currently available difficult to read [<xref ref-type="bibr" rid="ref4">4</xref>]. Some of this difficulty can be attributed to inherent complexity in understanding the diseases, their causes, and the associated treatments, which may require advanced knowledge of biology, chemistry, or physiology to understand in detail. Much of the difficulty, though, can be attributed to a mismatch between the content delivered and the consumers who often have limited health literacy, low general education, or inadequate language skills. Low health literacy reduces health statuses of individuals [<xref ref-type="bibr" rid="ref3">3</xref>], is considered a &#8220;silent killer&#8221; [<xref ref-type="bibr" rid="ref5">5</xref>], and is estimated to cost up to US$238 billion annually [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
                <p>To increase health literacy, the method, medium, and language used play an important role. While one-on-one teaching may be the best solution, medical professionals do not have sufficient time or resources for this. Video and interactive methods can be very educative and are becoming increasingly available. The power of such methods to teach and demonstrate will likely play an important role in consumer health information. However, currently text remains the primary tool used to educate people.</p>
            </sec>
            <sec>
                <title>Factors Influencing Text Difficulty and Its Measurement</title>
                <p>
                    <xref ref-type="fig" rid="figure1">Figure 1</xref> provides an overview of three key factors representing the authors&#8217; view on influences on understanding and learning from text: personal characteristics, text characteristics, and measurement characteristics. Personal characteristics describe attributes about the reader. Some are innate and cannot be changed, for example, native language and general intelligence. Others are acquired, for example, vocabulary size and domain knowledge. Many of these characteristics have a direct effect on text comprehension and indirectly on learning since comprehension has been shown to affect learning [<xref ref-type="bibr" rid="ref7">7</xref>]. For example, stress, a personal characteristic, has been shown to affect reading behaviors. People with high stress rely more on visual summaries, even when incomplete, to answer text-based questions [<xref ref-type="bibr" rid="ref8">8</xref>]. Moreover, increased stress has also been related to lower comprehension of medical terminology [<xref ref-type="bibr" rid="ref9">9</xref>]. Other personal characteristics, such as the ability to form a good mental model, affect understanding since readers often rely on the mental model instead of the original text base [<xref ref-type="bibr" rid="ref10">10</xref>]. In addition, past behaviors and acquired skills can have an impact. Exposure to print, for example, has been found to be related to understanding. Landi [<xref ref-type="bibr" rid="ref11">11</xref>] found a positive relation with results for an author recognition test [<xref ref-type="bibr" rid="ref12">12</xref>] and question-answering tasks, while in our own work, we found a positive relation between self-reported reading and results for a fill-in-the-blank Cloze test [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
                <p>Text characteristics influence text difficulty and therefore understanding. These characteristics can be adjusted to improve the usefulness of text, but this has been shown to be challenging and very few studies have shown strong improvements in reader understanding. To further clarify the analysis of text characteristics and the text simplification problem in general, we distinguish between the perceived and actual text difficulty of a text. The distinction is based on evidence for the existence of perceived barriers from the Health Belief Model [<xref ref-type="bibr" rid="ref14">14</xref>] and the importance of perceived difficulty of behavioral control from the Theory of Planned Behavior [<xref ref-type="bibr" rid="ref15">15</xref>]. While actual difficulty is easily accepted as important, perceived difficulty cannot be ignored. At a minimum, it will impact whether or not a text will be read. However, it may affect health literacy in more ways; for example, Velayo [<xref ref-type="bibr" rid="ref16">16</xref>] found that a higher perceived difficulty correlated with a decrease in the recall of information.</p>
                <p>Text characteristics can include surface features, for example, spacing or font, and range from smaller units such as words, to larger units such as sentences or paragraphs. Using a Likert scale to measure perceived difficulty, it was found that texts with a higher ratio of function words, verbs, verb phrases, or containing more high-frequency words were seen as easier [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. For actual difficulty, simple surface features such as font and line spacing were shown not to affect remembering [<xref ref-type="bibr" rid="ref20">20</xref>]; however, using a fill-in-the-blanks test, additive and causal connectors were shown to be easier than adversative or sequential connectors [<xref ref-type="bibr" rid="ref21">21</xref>]. In addition to surface features, analysis can include broader features such as coherence, which is defined as good flow combined with a structured, logical argument [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. We found that increasing coherence with proper spacing around subtopics and better logical connectors improved question-answering (actual difficulty) [<xref ref-type="bibr" rid="ref13">13</xref>]. Not surprisingly, how a topic is presented in a text also influences learning; topics introduced as part of a refutation text, a text where misconceptions are explicitly addressed, led to increased learning and more valid inference but not increased quantity of information being recalled [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
                <p>
                    <italic>Measurement characteristics</italic> also play an important role in readability research, although they are often ignored. Historically, the most popular measurement has been readability formulas, which generate a single number often based only on relative word and sentence length and are used as stand-ins for text complexity [<xref ref-type="bibr" rid="ref24">24</xref>]. These formulas have become popular even though they ignore current knowledge about the reading process, have a shaky statistical basis, and are unhelpful as writing guidelines [<xref ref-type="bibr" rid="ref25">25</xref>]. The Flesch-Kincaid Grade Level formula is the most common in health care literature [<xref ref-type="bibr" rid="ref26">26</xref>]. Even though different tools using the formula sometimes return different levels for the same text [<xref ref-type="bibr" rid="ref27">27</xref>], it has been used to evaluate patient education materials [<xref ref-type="bibr" rid="ref28">28</xref>], general websites [<xref ref-type="bibr" rid="ref29">29</xref>], and information on specific topics such as abdominal aortic aneurysms [<xref ref-type="bibr" rid="ref30">30</xref>] and back pain [<xref ref-type="bibr" rid="ref31">31</xref>]. Other readability formulas, such as the Simple Measure of Gobbledygook (SMOG) and Gunning Fog Index, have also been shown to be problematic for evaluating health-related materials for similar reasons [<xref ref-type="bibr" rid="ref32">32</xref>]. Simplifying text based on these formulas sometimes results in more difficult text, that is, the simplicity paradox [<xref ref-type="bibr" rid="ref5">5</xref>], because the simplification concentrates on writing style rather than content [<xref ref-type="bibr" rid="ref2">2</xref>]. As a result, increasingly more concerns are raised about the effectiveness of these formulas for simplifying consumer health texts [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
                <p>Better measures should be developed and used to evaluate text and motivate algorithmic components. These must be evaluated on a representative sample and measure not just the perception of difficulty, but more importantly understanding and retention of information. By using different measures, we can better evaluate the impact of simplification tools. For example, question-answering tasks (eg, multiple-choice, open-ended, or free recall questions), fill-in-the-blanks tasks (eg, multiple-choice or open blanks), and teach-back methods (eg, explain a concept or summarize a topic) can be used to measure understanding. Measures that test retention of information can follow the same style of questions, while measures of learning from a text require a comparison between pre- and post-reading scores.</p>
                <p>Interactions can also exist between personal, text, and even measurement characteristics. For example, the impact of text coherence on the reader has been found to interact with user characteristics and with the type of measurement. Overall coherence did not affect recall (actual difficulty) but affected remembering and understanding when measured by question-answering (actual difficulty) for readers with high knowledge but low interest or low knowledge but high interest in a topic [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Personal interest in the topic has also repeatedly been shown to be relevant. A higher interest leads to increased learning [<xref ref-type="bibr" rid="ref34">34</xref>] and recall [<xref ref-type="bibr" rid="ref35">35</xref>]; however, the coherence of text [<xref ref-type="bibr" rid="ref34">34</xref>] and prior knowledge [<xref ref-type="bibr" rid="ref35">35</xref>] influence this relationship.</p>
            </sec>
            <sec>
                <title>Objective</title>
                <p>Our objective is twofold. First, we address the need for an evidence-based algorithm that pinpoints difficult text. Second, we focus on providing appropriate, easier alternatives to a writer in an effective and efficient manner. We present here our first fully automated version of the <italic>lexical</italic> simplification algorithm, which identifies difficult terms and generates a list of easier alternatives based on information extracted from dictionaries and other databases. In a pilot study [<xref ref-type="bibr" rid="ref36">36</xref>], we introduced the text simplification algorithm and presented an initial user study. This work builds upon the lessons learned in the pilot study and differs in a number of key dimensions: (1) the algorithm examined here is fully automated, (2) the simplification of text is done by an independent writer, not the developers, and (3) the evaluation is based on a new study with different participants, new stimuli, and new, more comprehensive metrics.</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Factors that influence understanding and retention of information.</p>
                    </caption>
                    <graphic xlink:href="jmir_v15i7e144_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Text Simplification Algorithm and Writing Process</title>
                <p>The automated algorithm executes two steps. The first step is <italic>identification of difficult terms.</italic> We conducted corpus analyses and found that the term familiarity differed between easy and difficult texts [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Motivated by this, our algorithm uses the Google Web Corpus [<xref ref-type="bibr" rid="ref37">37</xref>], which contains <italic>n</italic>-gram counts from a corpus of 1 trillion words from public webpages to identify difficult terms. Terms with a low frequency in this corpus are assumed to be less familiar and therefore more difficult since a reader would not encounter them often. We used unigrams and the 5000<sup>th</sup> most frequent word, which has a frequency of 15,377,914, as our threshold for distinguishing less familiar terms. Any term with a lower frequency is considered difficult and is a candidate for replacement.</p>
                <p>We used the Google Web Corpus because its terms are representative of everyday readers without special medical knowledge. Other resources may provide additional value but may also introduce inconsistencies. For example, the Google Book Corpus contains many medical books resulting in higher frequencies for medical terms. The Unified Medical Language System (UMLS) contains both medical and general terms. Distinguishing between them algorithmically would be necessary, which is not an easy task, and may not improve upon the frequency-based approach by much.</p>
                <p>The second step is the <italic>identification and presentation of easier alternatives for each difficult term</italic>. The list of candidate replacements is generated from synonyms and hypernyms from WordNet 2.0 [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]; definitions and semantic types from the UMLS; and definitions from both the English and Simple English Wiktionaries. Only alternatives that possess the same part of speech based on an automatic tagger are presented. In addition, only substitutions with a higher term frequency than the original word are suggested (ie, more familiar). The number of alternatives provided can be adjusted based on user preference or application; currently, we aim to provide a minimum of 7 alternatives. Candidate replacements are sorted both by source (for the convenience of the writer) and by their familiarity in the Google Web Corpus.</p>
                <p>In contrast to the previous version of our simplification algorithm [<xref ref-type="bibr" rid="ref36">36</xref>], which involved one of the authors manually looking up each word to generate the candidate suggestions, the current version is fully automated. To ensure that the algorithm is sufficiently efficient for later inclusion in a comprehensive tool, we tested its efficiency on Wikipedia articles. We selected 100 conditions randomly (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>) from a list of diseases provided by the Mayo Clinic. For each disease, we retrieved the corresponding Wikipedia article. The articles were on average 2573 words long. On average, 617 words were tagged as difficult per article, for which easier alternatives were produced by the algorithm where available. The average run time was 37 seconds per document.</p>
                <p>Given the difficulty of completely automated translation, especially in domains such as health where information may not be omitted, we require a writer to finalize the text. At present, a Microsoft Excel spreadsheet is generated containing each original sentence from a text, the same sentence with blanks for all difficult words, and alternatives for each difficult word. The alternatives are presented in a column and ordered according to source and term familiarity. The writer chooses the best alternative, replacing it in the original text. Ensuring grammatical correctness (eg, consistent pluralization) is currently the responsibility of the writer.</p>
            </sec>
            <sec>
                <title>Original and Simplified Texts (Study Stimuli)</title>
                <p>A subject expert (SE), a medical librarian, simplified the texts. To optimize external validity, we worked with one expert to rewrite the text since this is how the final tool will be used. To increase internal validity, we provided the SE with rules to ensure that we measured only the effects resulting from interaction with our algorithm. She was asked to &#8220;Try to replace as many words as possible&#8221; and when making a replacement &#8220;single words can just be replaced but longer fragments should be added before or after the sentence (with some adjustment for flow of text)&#8221;. The SE served two main roles: (1) to determine if a difficult word flagged by the algorithm needs to be replaced, and (2) for those words requiring replacement, to select an appropriate substitution from the alternatives suggested by the algorithm. If the SE deemed that an appropriate synonym existed for a difficult word in the algorithmically generated options, then the difficult word was simply replaced by the synonym. If the simplification option selected by the SE was not a synonym, it needed to be added to the text so that no original information was deleted from the text. Simplifications containing longer phrases or sentences (eg, from definitions) were added by using parentheses or by adding a separate sentence before or after the target sentence. The text was adjusted by the SE as necessary to create grammatically correct sentences.</p>
                <p>In previous work [<xref ref-type="bibr" rid="ref36">36</xref>], we noticed that lexical simplifications by the authors reduced the flow of the text thereby increasing text difficulty. Therefore, the SE was asked to pay close attention to how alternatives were inserted and to choose the option that resulted in the best flow. If the SE preferred a term other than those suggested by the algorithm, she could add it to the text for familiarity verification. Once the text was rewritten, it was rerun through the simplification algorithm to ensure that newly added text was sufficiently simple. This included the verification of any synonyms by the SE.</p>
                <p>To measure <italic>perceived difficulty</italic>, we selected 5 text snippets; these were individual sentences and in one case 2 short sentences combined. Such short snippets do not require much time to read, provide more data points than one long text, and ensure that study participants do not get overwhelmed. The sentences were taken from English Wikipedia articles, and each sentence was simplified by the SE using our algorithm. Our algorithm tagged an average of 11 words per sentence as difficult, of which 5.6 (53%) were replaced.</p>
                <p>To measure <italic>actual difficulty,</italic> it was necessary to use longer texts to allow for questions about the content to be posed. We used two different texts so that each participant in the study worked with an original and simplified text for better (statistical) control of interpersonal differences. We chose a text on liver cirrhosis and one on asthma because most people are somewhat familiar with them and both conditions have several commonly accepted myths associated with them. These myths were incorporated into our multiple-choice questions and provided an excellent opportunity to demonstrate learning. Each text was simplified using our approach described above. Texts were obtained from the initial summary paragraphs from their Wikipedia Web pages and were similar in composition. Our algorithm tagged 210 words as difficult in the liver cirrhosis document, of which 66 (31%) were replaced by the writer during simplification. In the asthma document, 122 words were tagged as difficult and 53 (43%) were replaced during simplification.</p>
                <p>
                    <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref> show an overview of the text characteristics before and after simplification. We include the Flesch-Kincaid Grade Level for comparison with other work. Below are examples of an original and simplified snippet used as part of the study (perceived difficulty):</p>
                <list list-type="bullet">
                    <list-item>
                        <p>original: &#8220;Gout is a disorder of purine metabolism, and occurs when its final metabolite, uric acid, crystallizes in the form of monosodium urate, precipitating in joints, on tendons, and in the surrounding tissues.&#8221;</p>
                    </list-item>
                    <list-item>
                        <p>simplified: &#8220;Gout is a disease of the processing of the chemical substance called purine, and occurs when its last chemical product (uric acid) makes crystals (monosodium urate), which collect in joints, on tendons, and in the surrounding tissues.&#8221;</p>
                    </list-item>
                </list>
                <p>The texts, both original and simplified versions, are provided in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>.</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Text snippet characteristics.</p>
                    </caption>
                    <table width="638" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="180" />
                        <col width="180" />
                        <col width="180" />
                        <thead>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td colspan="2">Lexical simplification</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Sentences (N=5)
                                </td>
                                <td>Original</td>
                                <td>Simplified</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="bottom">
                                <td>Word count (avg)</td>
                                <td>28.4</td>
                                <td>37.6</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Flesch-Kincaid grade level (avg)</td>
                                <td>18.6</td>
                                <td>17.3</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>Document characteristics.</p>
                    </caption>
                    <table width="638" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="140" />
                        <col width="42" />
                        <col width="75" />
                        <col width="45" />
                        <col width="42" />
                        <col width="75" />
                        <col width="45" />
                        <thead>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td colspan="6">Lexical simplification</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                 Documents
                                </td>
                                <td colspan="3">Original</td>
                                <td colspan="3">Simplified</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Topic</td>
                                <td>Asthma</td>
                                <td>Liver cirrhosis</td>
                                <td>Average</td>
                                <td>Asthma</td>
                                <td>Liver cirrhosis</td>
                                <td>Average</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="bottom">
                                <td>Word count</td>
                                <td>623</td>
                                <td>481</td>
                                <td>552</td>
                                <td>779</td>
                                <td>696</td>
                                <td>737.5</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Sentence count</td>
                                <td>31</td>
                                <td>25</td>
                                <td>28</td>
                                <td>33</td>
                                <td>27</td>
                                <td>30</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Flesch-Kincaid grade level</td>
                                <td>13.9</td>
                                <td>14.5</td>
                                <td>14.2</td>
                                <td>13.7</td>
                                <td>14.3</td>
                                <td>14.0</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec>
                <title>Metrics</title>
                <p>To measure <italic>perceived difficulty</italic>, participants judged a sentence using a 5-point Likert scale with the following labels: Very Easy, Easy, Neither, Hard, Very Hard. Perceived difficulty is the score on this scale with 1 representing Very Easy and 5 Very Hard.</p>
                <p>To measure <italic>actual difficulty</italic>, we used metrics covering understanding, learning, and retention of information. For understanding of the text, we used 5 multiple-choice questions posed alongside the text. The questions targeted different sections of the text. Understanding was measured as the percentage of questions answered correctly.</p>
                <p>To measure learning, we compared scores on 7 multiple-choice questions shown both before and after reading the text. The text itself was not visible when the questions were presented. By asking the same questions before and after, we were able to use participants as their own controls. For each text, we created the multiple-choice questions based on commonly accepted myths. The myths were gathered by searching the Internet for &#8220;common myths about&#8230;&#8221;. Learning was measured as the increase in the percentage of questions answered correctly after versus before reading the text.</p>
                <p>To measure retention, we asked participants, after all sections had been completed, to list all facts (one per line) that they remembered from the texts. Retention can be simply measured as the number of facts listed; however, since these facts may contain errors, they were also graded by the authors. Two authors per topic independently graded all facts. Even though participants were asked to list 1 fact per line, many lines included multiple facts. Each fact was considered and awarded points separately: +1 for a correct fact and -1 for an incorrect one. To grade the answers in an objective manner, the order of answers was randomized per grader and the experimental condition was unknown. In cases with a large disparity between grades (scores diverged by more than 100%), a third grader (the SE) judged the results and provided the final score (similar to original manual GRE scoring [<xref ref-type="bibr" rid="ref40">40</xref>]). Retention was then measured with 2 metrics: the number of listed facts and the sum of the grades assigned to those facts.</p>
                <p>In addition to study questions, we also included qualifying questions. These were simple questions for which the answer was obvious. They helped filter results of participants who were not serious about the study. We included a qualifying question with each set of multiple-choice questions and filtered any participant who did not get all qualifying questions right.</p>
            </sec>
            <sec>
                <title>Participants</title>
                <p>Participants were recruited using Amazon&#8217;s Mechanical Turk (MTurk). MTurk is an online crowdsourcing service that allows for small tasks to be accomplished by human workers. Currently, Amazon has over 300,000 requested tasks and over half a million workers. Workers are paid a small sum for each task accomplished. MTurk has been used in a wide range of settings ranging from user studies to data annotation to subjective rating generation [<xref ref-type="bibr" rid="ref41">41</xref>]. The workers are a diverse group from all over the world with varied demographic characteristics [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. When precautions are taken to filter out ineffective workers, the quality of the data obtained has been shown to be at least as good as data obtained from more traditional approaches [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>].</p>
            </sec>
            <sec>
                <title>Procedure</title>
                <p>Participants were directed to our study website from MTurk, and the sections were presented in the following order:</p>
                <list list-type="bullet">
                    <list-item>
                        <p>The <italic>first page</italic> contained the welcome note and instructions to complete the study sections in order and without use of external sources. From this point, the browser back button was disabled.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>first study section</italic> showed the myth-based questions for a topic. Then, the text was shown together with new questions, followed by a repetition of the myth-based questions without the text. For each participant, the order of the questions and the order of the answers for each question were randomized. The topic was either liver cirrhosis or asthma, and the version was either original or simplified.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>second study section</italic> was identical to the first, but with a different text in a different version. Each participant received one original and one simplified version. The order and topics were balanced over the study so that all combinations of topic and difficulty level were presented.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>third study section</italic> contained the individual sentences that participants judged for perceived difficulty. The original and simplified versions of a sentence were paired because showing all sentences in one list made it very difficult for participants to notice differences and provide a rational judgment. The order within each pair and the order of the 5 pairs were randomized per participant.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>fourth study section</italic> contained demographic questions.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>fifth and sixth study sections</italic> contained the PSS-10 [<xref ref-type="bibr" rid="ref45">45</xref>], a standardized stress survey, and the STOFHLA [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>], a standardized health literacy measure.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>seventh and eighth sections</italic> contained the request for free recall of information for the first and second text.</p>
                    </list-item>
                    <list-item>
                        <p>The <italic>final page</italic> showed a Thank You note and the code to be submitted for payment at MTurk.</p>
                    </list-item>
                </list>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Participant Characteristics</title>
                <p>We invited MTurk workers located in the United States with a 95% approval rate on tasks previously performed for other requesters. They were paid US$1.50 for completing the survey. Upon start, 134 participants signed up and 105 completed the study. Of those who completed, 6 did not pass our filtering criteria resulting in a total of 99 valid participants. Completing the survey took on average 33 minutes. The shortest time spent was 13 minutes and the longest was 45 minutes.</p>
                <p>
                    <xref ref-type="table" rid="table3">Table 3</xref> provides the demographic information. Most participants (80%) were between 21 and 50 years old, with only a small group aged 20 or younger (3%) or older than 60 years (4%). The majority were female (63%), white (89%), and not Hispanic or Latino (93%). Most had moderate education: 48% had a high school diploma, 16% an associate&#8217;s degree, and 25% a bachelor&#8217;s degree. The majority (89%) spoke exclusively English at home.</p>
            </sec>
            <sec>
                <title>Perceived Difficulty</title>
                <p>We found a significant beneficial effect of simplification on perceived difficulty with simplified sentences being judged as simpler. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows an overview of the average score and standard error bars for each sentence and for all sentences combined. A paired-samples <italic>t</italic>-test showed the difference to be significant for all pairs (<italic>P</italic>&#60;.001) and for all pairs combined (<italic>P</italic>&#60;.001).</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Participant demographic information (n=99).</p>
                    </caption>
                    <table width="638" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="144" />
                        <col width="401" />
                        <col width="51" />
                        <thead>
                            <tr valign="bottom">
                                <td colspan="2">Characteristics</td>
                                <td>n</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="bottom">
                                <td>
                                    <bold>Age</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>20 or younger</td>
                                <td>3</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>21-30</td>
                                <td>35</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>31-40</td>
                                <td>24</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>41-50</td>
                                <td>21</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>51-60</td>
                                <td>12</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>61-70</td>
                                <td>4</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>71 or older</td>
                                <td>-</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <bold>Gender</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Female</td>
                                <td>62</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Male</td>
                                <td>37</td>
                            </tr>
                            <tr valign="bottom">
                                <td colspan="3">
                                    <bold>Race (multiple choices allowed)</bold>
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>American Indian / Native Alaskan</td>
                                <td>2</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Asian</td>
                                <td>7</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Black or African American</td>
                                <td>5</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Native Hawaiian or Other Pacific Islander</td>
                                <td>-</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>White</td>
                                <td>88</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <bold>Ethnicity</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Hispanic or Latino</td>
                                <td>7</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Not Hispanic or Latino</td>
                                <td>92</td>
                            </tr>
                            <tr valign="bottom">
                                <td colspan="3">
                                    <bold>Education (highest completed)</bold>
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Less than High School</td>
                                <td>1</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>High School Diploma</td>
                                <td>48</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Associate&#8217;s Degree</td>
                                <td>16</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Bachelor&#8217;s Degree</td>
                                <td>25</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Master&#8217;s Degree</td>
                                <td>6</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Doctorate</td>
                                <td>3</td>
                            </tr>
                            <tr valign="bottom">
                                <td colspan="3">
                                    <bold>Language skills (frequency of speaking English at home)</bold>
                                </td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Never English</td>
                                <td>-</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Rarely English</td>
                                <td>1</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Half English</td>
                                <td>3</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Mostly English</td>
                                <td>6</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Only English</td>
                                <td>89</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Average perceived difficulty scores (lower score = perceived simpler).</p>
                    </caption>
                    <graphic xlink:href="jmir_v15i7e144_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Actual Difficulty: Understanding, Learning, and Retention</title>
                <p>
                    <xref ref-type="fig" rid="figure3">Figure 3</xref> shows the mean scores and standard error bars for understanding. We conducted a two-way analysis of variance (ANOVA) with simplification and topic as independent variables. Topic was included to provide a more nuanced view. For understanding, we found two main effects. The first is for simplification with higher scores for simplified text. There were on average 52% correct answers with an original document and 63% with a simplified document (<italic>F</italic>
                    <sub>1,198</sub>=13.869, <italic>P</italic>&#60;.001). There was also a main effect for topic (<italic>F</italic>
                    <sub>1,198</sub>=13.869, <italic>P</italic>&#60;.001) with higher scores achieved for the asthma document. Since the increases in understanding after simplification were comparable for both topics, the interaction effect was not significant.</p>
                <p>
                    <xref ref-type="fig" rid="figure4">Figure 4</xref> shows the mean scores and standard error bars for the learning of information. We conducted a comparable two-way ANOVA with the simplification and topic as independent variables. We found a significant main effect of simplification of text with more learning from simplified documents (18%) than from the original documents (9%) (<italic>F</italic>
                    <sub>1,198</sub>=9.238, <italic>P</italic>=.003). A second main effect was found for topic (<italic>F</italic>
                    <sub>1,198</sub>=22.301, <italic>P</italic>&#60;.001) with more learning with the liver cirrhosis document (20%) than with the asthma document (6%). The interaction between both independent variables was also significant (<italic>F</italic>
                    <sub>1,198</sub>=4.071, <italic>P</italic>=.045) with the learning being more pronounced with the liver cirrhosis than with the asthma document.</p>
                <p>
                    <xref ref-type="table" rid="table4">Table 4</xref> provides an overview of the retention of information using both raw and graded scores. With simplified documents, slightly more facts were listed (5.04) than with original documents (4.66). There were also slightly more words (43.60) and unique words (32.36) used after reading simplified documents compared to original documents (40.07 words and 30.79 unique words). These differences were not statistically significant. The graded scores show similar small differences. There were slightly more correct facts after reading simplified documents (5.04 facts) than after reading the original documents (4.70 facts). However, the difference is not statistically significant.</p>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Average understanding scores.</p>
                    </caption>
                    <graphic xlink:href="jmir_v15i7e144_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure4" position="float">
                    <label>Figure 4</label>
                    <caption>
                        <p>Average learning scores.</p>
                    </caption>
                    <graphic xlink:href="jmir_v15i7e144_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>Retention of information: mean and standard deviation.</p>
                    </caption>
                    <table width="547" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="131" />
                        <col width="42" />
                        <col width="73" />
                        <col width="45" />
                        <col width="42" />
                        <col width="73" />
                        <col width="45" />
                        <thead>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td colspan="3">Original text</td>
                                <td colspan="3">Simplified text</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Average counts</td>
                                <td>Asthma</td>
                                <td>Liver cirrhosis</td>
                                <td>Average</td>
                                <td>Asthma</td>
                                <td>Liver cirrhosis</td>
                                <td>Average</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="bottom">
                                <td>Facts</td>
                                <td>4.76</td>
                                <td>4.55</td>
                                <td>4.66</td>
                                <td>4.96</td>
                                <td>5.12</td>
                                <td>5.04</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Words</td>
                                <td>40.50</td>
                                <td>39.63</td>
                                <td>40.07</td>
                                <td>42.90</td>
                                <td>44.24</td>
                                <td>43.60</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Unique words</td>
                                <td>31.38</td>
                                <td>30.20</td>
                                <td>30.79</td>
                                <td>32.39</td>
                                <td>32.34</td>
                                <td>32.36</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Average score (graded facts)</td>
                                <td>4.50</td>
                                <td>4.91</td>
                                <td>4.70</td>
                                <td>4.73</td>
                                <td>5.35</td>
                                <td>5.04</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec>
                <title>Relationships With Participant Characteristics</title>
                <p>To complete our analysis, we conducted a correlation analysis using a 2-tailed Pearson product-moment correlation coefficient (<italic>r</italic>). We evaluated the personal characteristics and the scores for perceived and actual difficulty over experimental conditions. We assigned a code to the education level and language skills with a higher score indicating a higher level or skill. We also included the PSS scores and STOFHLA scores.</p>
                <p>Overall, there were few significant correlations. There were no significant correlations between the perceived difficulty of sentences and the personal characteristics. For actual difficulty, only education mattered. There was a positive correlation between education and understanding (<italic>r</italic>=.244, <italic>P</italic>=.015), facts listed (<italic>r</italic>=.296, <italic>P</italic>=.003), graded facts (<italic>r</italic>=.411, <italic>P</italic>&#8804;.001), and both the word count (<italic>r</italic>=.316, <italic>P</italic>=.001) and unique word count (<italic>r</italic>=.329, <italic>P</italic>=.001). Among the personal characteristics themselves, two correlations were significant. There was a negative correlation between language skills and stress levels, indicating higher stress related to lower language skills (<italic>r</italic>=-.210, <italic>P</italic>=.037) and also a negative correlation between language skills and education level (<italic>r</italic>=-.260, <italic>P</italic>=.009). Upon closer inspection, this last negative correlation was due to a few individuals with higher degrees who speak a different language at home, that is, Chinese, Tamil, or Farsi.</p>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>This work reported on a lexical simplification algorithm that automatically detects difficult terms and suggests easier alternatives. The writing process is semiautomated since the final replacements are made by the writer. A controlled user study showed how simplifying text in this manner led to significant improvements in both perceived and actual difficulty of text.</p>
                <p>The results on perceived difficulty corroborate earlier work on manual lexical simplification. In general, changing the text to improve perceived difficulty is more straightforward. Consistent and strong effects are found even when using short text snippets or small sample sizes. Even so, this effect is important and shows that <italic>lexical simplification has a beneficial impact on perceived difficulty</italic>. Future studies will look more closely at how perceived difficulty affects motivation to read and ability to complete reading, among other factors.</p>
                <p>The results on actual difficulty are strong and very encouraging. They also show the importance of using different metrics. We found a strong effect on understanding with simplified text being better understood. However, this effect also depended on the topic being studied. Learning showed a similar strong effect: there was more learning with simplified documents. These effects lead to our conclusion that <italic>lexical simplification is beneficial and has an immediate impact on understanding and learning</italic>. However, we did not find an effect of simplification on retention of information. This may be due to a lack of sustained learning or it may be due to the study design. In previous work on search engines [<xref ref-type="bibr" rid="ref48">48</xref>], we found that many study participants stop finding information at some given point, regardless of how easy or difficult a task is. We may be witnessing a similar effect with participants submitting &#8220;enough&#8221; facts regardless of how many they remember. In future work, we aim to provide better incentives to encourage participants to submit more facts.</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>There are several limitations we would like to point out. First, we evaluated our approach with short texts taken from Wikipedia. Different effects may be found for longer or more difficult texts. However, working with short texts allows for a controlled experiment, thereby avoiding potentially confounding variables. Future work will look for repeat effects in longer documents. Second, we worked with general topics. Automatically recognizing which different texts, either distinguished by difficulty level or other factors, would benefit from simplification would be an important addition to our work. In addition, working with personally relevant topics may increase effects, since motivation has been shown to be important to the reading process. Third, we worked with only one subject expert who rewrote text. Comparing different writers may show further strengths and weaknesses of our approach. Working with a team of writers may provide a more balanced gold standard; however, this approach has also been shown to introduce noise when experts disagree [<xref ref-type="bibr" rid="ref49">49</xref>]. Further research is needed to understand the impact of each of these limitations.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>In addition to these study limitations, there is also much room for future development of our algorithm. We aim to more precisely target difficult words so that fewer words are tagged for replacement while still impacting the overall difficulty of text. We aim to provide a shorter and more precise list of potential replacements by working with resources such as the Consumer Health Vocabulary [<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>]. This will make the process more efficient for the writer while requiring less time to generate alternatives. For example, we plan to test phrases in addition to individual words to estimate difficulty and work with different thresholds. We also are working toward combining lexical simplification with other forms of simplification of relevant text features.</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>List of conditions.</p>
                <media xlink:href="jmir_v15i7e144_app1.pdf" xlink:title="PDF File (Adobe PDF File), 7KB" />
            </app>
            <app id="app2">
                <title>Multimedia Appendix 2</title>
                <p>Stimuli: Original and simplified texts.</p>
                <media xlink:href="jmir_v15i7e144_app2.pdf" xlink:title="PDF File (Adobe PDF File), 62KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">ANOVA</term>
                    <def>
                        <p>analysis of variance</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">GRE</term>
                    <def>
                        <p>Graduate Record Examinations</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">SE</term>
                    <def>
                        <p>subject expert</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">UMLS</term>
                    <def>
                        <p>Unified Medical Language System</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>The authors would like to thank their study participants. The study was reviewed by the Institutional Review Board (IRB) of Claremont Graduate University.</p>
            <p>This work was supported by the US National Library of Medicine, NIH/NLM 1R03LM010902-01.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>Health Topics</source>
                    <year>2011</year>
                    <access-date>2013-07-07</access-date>
                    <publisher-name>Pew Research Center</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/Reports/2011/HealthTopics.aspx">http://www.pewinternet.org/Reports/2011/HealthTopics.aspx</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HwPg8amf</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>Y</given-names>
                        </name>
                    </person-group>
                    <article-title>Automatic Recognition of Text Difficulty from Consumers Health Information</article-title>
                    <source>Proceedings of the 19th IEEE International Symposium on Computer-Based Medical Systems</source>
                    <year>2006</year>
                    <conf-name>19th IEEE International Symposium on Computer-Based Medical Systems</conf-name>
                    <conf-date>June 22-23, 2006</conf-date>
                    <conf-loc>Salt Lake City</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Nielsen-Bohlman</surname>
                            <given-names>L</given-names>
                        </name>
                        <collab>Institute of Medicine /Committee on Health</collab>
                    </person-group>
                    <source>Health literacy: a prescription to end confusion</source>
                    <year>2004</year>
                    <publisher-loc>Maryland</publisher-loc>
                    <publisher-name>National Academies Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Yan</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Song</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>X</given-names>
                        </name>
                    </person-group>
                    <article-title>Concept-based Document Readability in Domain Specific Information Retrieval</article-title>
                    <source>Proceedings of the 15th ACM International Conference on Information and Knowledge Management</source>
                    <year>2006</year>
                    <conf-name>15th ACM International Conference on Information and Knowledge Management</conf-name>
                    <conf-date>Nov. 5-11, 2006</conf-date>
                    <conf-loc>Arlington, Virginia</conf-loc>
                    <fpage>540</fpage>
                    <lpage>549</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zarcadoolas</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>The simplicity complex: exploring simplified health messages in a complex world</article-title>
                    <source>Health Promot Int</source>
                    <year>2011</year>
                    <month>09</month>
                    <volume>26</volume>
                    <issue>3</issue>
                    <fpage>338</fpage>
                    <lpage>50</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://heapro.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=21149317" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1093/heapro/daq075</pub-id>
                    <pub-id pub-id-type="medline">21149317</pub-id>
                    <pub-id pub-id-type="pii">daq075</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="web">
                    <source>Low health literacy report</source>
                    <access-date>2013-02-06</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://sphhs.gwu.edu/departments/healthpolicy/CHPR/downloads/LowHealthLiteracyReport10_4_07.pdf">http://sphhs.gwu.edu/departments/healthpolicy/CHPR/downloads/LowHealthLiteracyReport10_4_07.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6EEgqYeox</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Diakidoy</surname>
                            <given-names>I-A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mouskounti</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ioannides</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Comprehension and Learning from Refutation and Expository Texts</article-title>
                    <source>Reading Research Quarterly</source>
                    <year>2011</year>
                    <volume>46</volume>
                    <issue>1</issue>
                    <fpage>22</fpage>
                    <pub-id pub-id-type="doi">10.1598/RRQ.46.1.2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>Perils of providing visual health information overviews for consumers with low health literacy or high stress</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2010</year>
                    <volume>17</volume>
                    <issue>2</issue>
                    <fpage>220</fpage>
                    <lpage>3</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.bmj.com/cgi/pmidlookup?view=long&#38;pmid=20190068" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/jamia.2009.002717</pub-id>
                    <pub-id pub-id-type="medline">20190068</pub-id>
                    <pub-id pub-id-type="pii">17/2/220</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3000790</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Van Servellen</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lombardi</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Herrera</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Health literacy in low-income Latino men and women receiving antiretroviral therapy in community-based treatment centers</article-title>
                    <source>AIDS Patient Care and STDs</source>
                    <year>2003</year>
                    <month>06</month>
                    <volume>17</volume>
                    <issue>6</issue>
                    <fpage>283</fpage>
                    <lpage>98</lpage>
                    <pub-id pub-id-type="doi">10.1089/108729103322108166</pub-id>
                    <pub-id pub-id-type="medline">12880492</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kintsch</surname>
                            <given-names>W</given-names>
                        </name>
                    </person-group>
                    <article-title>Learning from Text</article-title>
                    <source>Cognition and Instruction</source>
                    <year>1986</year>
                    <volume>3</volume>
                    <issue>2</issue>
                    <fpage>87</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Landi</surname>
                            <given-names>N</given-names>
                        </name>
                    </person-group>
                    <article-title>An examination of the relationship between reading comprehension, higher-level and lower-level reading sub-skills in adults</article-title>
                    <source>Read Writ</source>
                    <year>2010</year>
                    <month>07</month>
                    <day>1</day>
                    <volume>23</volume>
                    <issue>6</issue>
                    <fpage>701</fpage>
                    <lpage>717</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21691452" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1007/s11145-009-9180-z</pub-id>
                    <pub-id pub-id-type="medline">21691452</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3117585</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Stanovich</surname>
                            <given-names>KE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>West</surname>
                            <given-names>RF</given-names>
                        </name>
                    </person-group>
                    <article-title>Exposure to Print and Orthographic Processing</article-title>
                    <source>Reading Research Quarterly</source>
                    <year>1989</year>
                    <volume>24</volume>
                    <issue>4</issue>
                    <fpage>402</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kauchak</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mouradi</surname>
                            <given-names>O</given-names>
                        </name>
                    </person-group>
                    <article-title>A User-study Measuring the Effects of Lexical Simplification and Coherence Enhancement on Perceived and Actual Text Difficulty</article-title>
                    <source>Int J Med Inform</source>
                    <year>2013</year>
                    <comment>(forthcoming)</comment>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Janz</surname>
                            <given-names>NK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Becker</surname>
                            <given-names>MH</given-names>
                        </name>
                    </person-group>
                    <article-title>The Health Belief Model: a decade later</article-title>
                    <source>Health Educ Q</source>
                    <year>1984</year>
                    <volume>11</volume>
                    <issue>1</issue>
                    <fpage>1</fpage>
                    <lpage>47</lpage>
                    <pub-id pub-id-type="medline">6392204</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Trafimow</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sheeran</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Conner</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Finlay</surname>
                            <given-names>KA</given-names>
                        </name>
                    </person-group>
                    <article-title>Evidence that perceived behavioural control is a multidimensional construct: perceived control and perceived difficulty</article-title>
                    <source>Br J Soc Psychol</source>
                    <year>2002</year>
                    <month>03</month>
                    <volume>41</volume>
                    <issue>Pt 1</issue>
                    <fpage>101</fpage>
                    <lpage>21</lpage>
                    <pub-id pub-id-type="medline">11970777</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Velayo</surname>
                            <given-names>RS</given-names>
                        </name>
                    </person-group>
                    <article-title>Retention of Content as a Function of Presentation Mode and Perceived Difficulty</article-title>
                    <source>Reading Improvement</source>
                    <year>1993</year>
                    <volume>30</volume>
                    <issue>4</issue>
                    <fpage>216</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Endicott</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Term Familiarity to Indicate Perceived and Actual Difficulty of Text in Medical Digital Libraries</article-title>
                    <source>Proceedings of the International Conference on Asia-Pacific Digital Libraries (ICADL) - Digital Libraries -- for Culture Heritage, Knowledge Dissemination, and Future Creation</source>
                    <year>2011</year>
                    <conf-name>International Conference on Asia-Pacific Digital Libraries (ICADL) - Digital Libraries -- for Culture Heritage, Knowledge Dissemination, and Future Creation</conf-name>
                    <conf-date>October 2011</conf-date>
                    <conf-loc>Beijing, China</conf-loc>
                    <fpage>24</fpage>
                    <lpage>27</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Endicott</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Combining NLP with Evidence-based Methods to Find Text Metrics related to Perceived and Actual Text Difficulty</article-title>
                    <source>Proceedings of the 2nd ACM SIGHIT International Health Informatics Symposium (ACM IHI)</source>
                    <year>2012</year>
                    <conf-name>2nd ACM SIGHIT International Health Informatics Symposium (ACM IHI)</conf-name>
                    <conf-date>January 2012</conf-date>
                    <conf-loc>Miami, FL</conf-loc>
                    <fpage>28</fpage>
                    <lpage>30</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Pitler</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nenkova</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Revisiting Readability: A Unified Framework for Predicting Text Quality</article-title>
                    <source>Proceedings of the Empirical Methods in Natural Language Processing</source>
                    <year>2008</year>
                    <conf-name>Empirical Methods in Natural Language Processing</conf-name>
                    <conf-date>2008</conf-date>
                    <conf-loc>Honolulu</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Soleimani</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mohammadi</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>The Effect of Text Typographical Features on Legibility, Comprehension, and Retrieval of EFL Learners</article-title>
                    <source>English Language Teaching</source>
                    <year>2012</year>
                    <volume>5</volume>
                    <issue>8</issue>
                    <fpage>207</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Goldman</surname>
                            <given-names>SR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Murray</surname>
                            <given-names>JD</given-names>
                        </name>
                    </person-group>
                    <article-title>Knowledge of Connectors as Cohesion Devices in Text: A Comparative Study of Native-English and English-as-a-Second-Language Speakers</article-title>
                    <source>Journal of Educational Psychology</source>
                    <year>1992</year>
                    <volume>84</volume>
                    <issue>4</issue>
                    <fpage>504</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Boscolo</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mason</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Topic Knowledge, Text Coherence, and Interest: How they Interact in Learning from Instructional Texts</article-title>
                    <source>The Journal of Experimental Education</source>
                    <year>2003</year>
                    <volume>71</volume>
                    <issue>2</issue>
                    <fpage>126</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>McNamara</surname>
                            <given-names>DS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kintsch</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Songer</surname>
                            <given-names>NB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kintsch</surname>
                            <given-names>W</given-names>
                        </name>
                    </person-group>
                    <article-title>Are Good Texts Always Better? Interactions of Text Coherence, Background Knowledge, and Levels of Understanding in Learning from Text</article-title>
                    <source>Cognition and Instruction</source>
                    <year>1996</year>
                    <volume>14</volume>
                    <issue>1</issue>
                    <fpage>1</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>DuBay</surname>
                            <given-names>WH</given-names>
                        </name>
                    </person-group>
                    <article-title>The Principles of Readability</article-title>
                    <source>Impact Information</source>
                    <year>2004</year>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bruce</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rubin</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Starr</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Why Readability Formulas Fail</article-title>
                    <source>IEEE Transactions on Professional Communication</source>
                    <year>1981</year>
                    <volume>24</volume>
                    <issue>1</issue>
                    <fpage>50</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>L-W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schmitt</surname>
                            <given-names>MR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wen</surname>
                            <given-names>FK</given-names>
                        </name>
                    </person-group>
                    <article-title>Assessing Readability Formula Differences with Written Health Information Materials: Application, Results, and Recommendations</article-title>
                    <source>Research in Social &#38; Administrative Pharmacy</source>
                    <year>2012</year>
                    <comment>(forthcoming)</comment>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sirico</surname>
                            <given-names>LJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Readability Studies: How Technocentrism Can Compromise Research and Legal Determinations</article-title>
                    <source>Villanova University Legal Working Paper Series</source>
                    <year>2008</year>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Polishchuk</surname>
                            <given-names>DL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hashem</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sabharwal</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Readability of online patient education materials on adult reconstruction Web sites</article-title>
                    <source>J Arthroplasty</source>
                    <year>2012</year>
                    <month>05</month>
                    <volume>27</volume>
                    <issue>5</issue>
                    <fpage>716</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.arth.2011.08.020</pub-id>
                    <pub-id pub-id-type="medline">22000573</pub-id>
                    <pub-id pub-id-type="pii">S0883-5403(11)00472-4</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ahmed</surname>
                            <given-names>OH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sullivan</surname>
                            <given-names>SJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schneiders</surname>
                            <given-names>AG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McCrory</surname>
                            <given-names>PR</given-names>
                        </name>
                    </person-group>
                    <article-title>Concussion information online: evaluation of information quality, content and readability of concussion-related websites</article-title>
                    <source>Br J Sports Med</source>
                    <year>2012</year>
                    <month>07</month>
                    <volume>46</volume>
                    <issue>9</issue>
                    <fpage>675</fpage>
                    <lpage>83</lpage>
                    <pub-id pub-id-type="doi">10.1136/bjsm.2010.081620</pub-id>
                    <pub-id pub-id-type="medline">21504964</pub-id>
                    <pub-id pub-id-type="pii">bjsm.2010.081620</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bailey</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Coughlin</surname>
                            <given-names>PA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sohrabi</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Griffin</surname>
                            <given-names>KJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rashid</surname>
                            <given-names>ST</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Troxler</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Scott</surname>
                            <given-names>DJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Quality and readability of online patient information for abdominal aortic aneurysms</article-title>
                    <source>J Vasc Surg</source>
                    <year>2012</year>
                    <month>07</month>
                    <volume>56</volume>
                    <issue>1</issue>
                    <fpage>21</fpage>
                    <lpage>6</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.jvs.2011.12.063</pub-id>
                    <pub-id pub-id-type="medline">22521801</pub-id>
                    <pub-id pub-id-type="pii">S0741-5214(11)03111-9</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hendrick</surname>
                            <given-names>PA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ahmed</surname>
                            <given-names>OH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bankier</surname>
                            <given-names>SS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chan</surname>
                            <given-names>TJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Crawford</surname>
                            <given-names>SA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ryder</surname>
                            <given-names>CR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Welsh</surname>
                            <given-names>LJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schneiders</surname>
                            <given-names>AG</given-names>
                        </name>
                    </person-group>
                    <article-title>Acute low back pain information online: an evaluation of quality, content accuracy and readability of related websites</article-title>
                    <source>Man Ther</source>
                    <year>2012</year>
                    <month>08</month>
                    <volume>17</volume>
                    <issue>4</issue>
                    <fpage>318</fpage>
                    <lpage>24</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.math.2012.02.019</pub-id>
                    <pub-id pub-id-type="medline">22464886</pub-id>
                    <pub-id pub-id-type="pii">S1356-689X(12)00049-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goryachev</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rosemblat</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Browne</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Keselman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                    </person-group>
                    <article-title>Beyond Surface Characteristics: A New Health Text-Specific Readability Measurement</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2007</year>
                    <fpage>418</fpage>
                    <lpage>22</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gemoets</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rosemblat</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tse</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Logan</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Assessing readability of consumer health information: an exploratory study</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2004</year>
                    <volume>107</volume>
                    <issue>Pt 2</issue>
                    <fpage>869</fpage>
                    <lpage>73</lpage>
                    <pub-id pub-id-type="medline">15360936</pub-id>
                    <pub-id pub-id-type="pii">D040004271</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Clinton</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van den Broek</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Interest, inferences, and learning from texts</article-title>
                    <source>Learning and Individual Differences</source>
                    <year>2012</year>
                    <volume>22</volume>
                    <issue>6</issue>
                    <fpage>650</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Er&#231;etin</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Effects of Topic Interest and Prior Knowledge on Text Recall and Annotation use in Reading a Hypermedia Text in the L2</article-title>
                    <source>ReCALL</source>
                    <year>2010</year>
                    <volume>22</volume>
                    <issue>2</issue>
                    <fpage>228</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Endicott</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mouradi</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kauchak</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Just</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Improving Perceived and Actual Text Difficulty for Health Information Consumers using Semi-Automated Methods</article-title>
                    <source>Proceedings of the American Medical Informatics Association (AMIA) Fall Symposium</source>
                    <year>2012</year>
                    <conf-name>American Medical Informatics Association (AMIA) Fall Symposium</conf-name>
                    <conf-date>Nov. 3-7, 2012</conf-date>
                    <conf-loc>Chicago, IL</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="web">
                    <source>Web 1T 5-gram Corpus Version 1.1</source>
                    <access-date>2013-07-07</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ldc.upenn.edu/Catalog/docs/LDC2006T13/readme.txt">http://www.ldc.upenn.edu/Catalog/docs/LDC2006T13/readme.txt</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HwSRwun2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fellbaum</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <source>WordNet: An Electronic Lexical Database</source>
                    <year>1998</year>
                    <publisher-loc>Cambridge, MA</publisher-loc>
                    <publisher-name>MIT Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>GA</given-names>
                        </name>
                    </person-group>
                    <article-title>WordNet: a lexical database for English</article-title>
                    <source>Commun. ACM</source>
                    <year>1995</year>
                    <volume>38</volume>
                    <issue>11</issue>
                    <fpage>39</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="web">
                    <source>How the GRE tests are scored</source>
                    <access-date>2013-02-06</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ets.org/gre/institutions/scores/how">http://www.ets.org/gre/institutions/scores/how</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6EEh5ILJE</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kittur</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chi</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Suh</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing User Studies with Mechanical Turk</article-title>
                    <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>
                    <year>2008</year>
                    <conf-name>SIGCHI Conference on Human Factors in Computing Systems</conf-name>
                    <conf-date>2008</conf-date>
                    <conf-loc>Florence, Italy</conf-loc>
                    <fpage>453</fpage>
                    <lpage>456</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ross</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Irani</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Silberman</surname>
                            <given-names>MS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zaldivar</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tomlinson</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Who are the Crowdworkers? Shifting Demographics in Mechanical Turk</article-title>
                    <source>Proceedings of the CHI '10 Extended Abstracts on Human Factors in Computing Systems</source>
                    <year>2010</year>
                    <conf-name>CHI '10 Extended Abstracts on Human Factors in Computing Systems</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Atlanta, Georgia</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref43">
                <label>43</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paolacci</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chandler</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ipeirotis</surname>
                            <given-names>PG</given-names>
                        </name>
                    </person-group>
                    <article-title>Running Experiments on Amazon Mechanical Turk</article-title>
                    <source>Judgment and Decision Making</source>
                    <year>2010</year>
                    <volume>5</volume>
                    <issue>5</issue>
                    <fpage>411</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref44">
                <label>44</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Buhrmester</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kwang</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gosling</surname>
                            <given-names>SD</given-names>
                        </name>
                    </person-group>
                    <article-title>Amazon's Mechanical Turk: A New Source of Inexpensive, Yet High-Quality, Data?</article-title>
                    <source>Perspectives on Psychological Science</source>
                    <year>2011</year>
                    <volume>6</volume>
                    <issue>1</issue>
                </nlm-citation>
            </ref>
            <ref id="ref45">
                <label>45</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kamarck</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mermelstein</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>A Global Measure of Perceived Stress</article-title>
                    <source>Journal of Health and Social Behavior</source>
                    <year>1983</year>
                    <volume>24</volume>
                    <issue>4</issue>
                    <fpage>385</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref46">
                <label>46</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Nurss</surname>
                            <given-names>JR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Parker</surname>
                            <given-names>RM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>MV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Baker</surname>
                            <given-names>DW</given-names>
                        </name>
                    </person-group>
                    <source>Test of Functional Health Literacy in Adults</source>
                    <year>1995</year>
                    <publisher-loc>Hartford, MI</publisher-loc>
                    <publisher-name>Peppercorn Books &#38; Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref47">
                <label>47</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Parker</surname>
                            <given-names>RM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Baker</surname>
                            <given-names>DW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>MV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nurss</surname>
                            <given-names>JR</given-names>
                        </name>
                    </person-group>
                    <article-title>The Test of Functional Health Literacy in Adults: A New Instrument for Measuring Patients&#8217; Literacy Skills</article-title>
                    <source>Journal of General Internal Medicine</source>
                    <year>1995</year>
                    <volume>10</volume>
                    <fpage>537</fpage>
                    <lpage>541</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref48">
                <label>48</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lally</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>The Use of Dynamic Contexts to Improve Casual Internet Searching</article-title>
                    <source>ACM Transactions on Information Systems</source>
                    <year>2003</year>
                    <volume>21</volume>
                    <issue>3</issue>
                    <fpage>229</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref49">
                <label>49</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rindflesch</surname>
                            <given-names>TC</given-names>
                        </name>
                    </person-group>
                    <article-title>Effects of information and machine learning algorithms on word sense disambiguation with small datasets</article-title>
                    <source>Int J Med Inform</source>
                    <year>2005</year>
                    <month>08</month>
                    <volume>74</volume>
                    <issue>7-8</issue>
                    <fpage>573</fpage>
                    <lpage>85</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2005.03.013</pub-id>
                    <pub-id pub-id-type="medline">15897005</pub-id>
                    <pub-id pub-id-type="pii">S1386-5056(05)00026-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref50">
                <label>50</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goryachev</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tse</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Keselman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boxwala</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Estimating consumer familiarity with health terminology: a context-based approach</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2008</year>
                    <volume>15</volume>
                    <issue>3</issue>
                    <fpage>349</fpage>
                    <lpage>56</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.bmj.com/cgi/pmidlookup?view=long&#38;pmid=18308983" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1197/jamia.M2592</pub-id>
                    <pub-id pub-id-type="medline">18308983</pub-id>
                    <pub-id pub-id-type="pii">M2592</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2409994</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref51">
                <label>51</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Keselman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>CA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Divita</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Browne</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                    </person-group>
                    <article-title>Consumer Health Concepts that do not Map to the UMLS: Where Do They Fit?</article-title>
                    <source>Journal of the American Medical Informatics Association</source>
                    <year>2008</year>
                    <volume>15</volume>
                    <issue>4</issue>
                    <fpage>496</fpage>
                    <lpage>505</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref52">
                <label>52</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Keselman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Logan</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>CA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leroy</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                    </person-group>
                    <article-title>Developing informatics tools and strategies for consumer-centered health communication</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2008</year>
                    <volume>15</volume>
                    <issue>4</issue>
                    <fpage>473</fpage>
                    <lpage>83</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.bmj.com/cgi/pmidlookup?view=long&#38;pmid=18436895" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1197/jamia.M2744</pub-id>
                    <pub-id pub-id-type="medline">18436895</pub-id>
                    <pub-id pub-id-type="pii">M2744</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2442255</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
