<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v19i10e342</article-id>
    <article-id pub-id-type="pmid">29038097</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.7754</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Recommending Education Materials for Diabetic Questions Using Information Retrieval Approaches</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Da Silva</surname>
          <given-names>Edson</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Fitzner</surname>
          <given-names>Karen</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
        <name name-style="western">
          <surname>Zeng</surname>
          <given-names>Yuqun</given-names>
        </name>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3402-1953</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
        <name name-style="western">
          <surname>Liu</surname>
          <given-names>Xusheng</given-names>
        </name>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7521-851X</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Wang</surname>
          <given-names>Yanshan</given-names>
        </name>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4433-7839</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Shen</surname>
          <given-names>Feichen</given-names>
        </name>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7803-2331</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib5">
        <name name-style="western">
          <surname>Liu</surname>
          <given-names>Sijia</given-names>
        </name>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9763-1164</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib6">
        <name name-style="western">
          <surname>Rastegar-Mojarad</surname>
          <given-names>Majid</given-names>
        </name>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6962-3554</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib7">
        <name name-style="western">
          <surname>Wang</surname>
          <given-names>Liwei</given-names>
        </name>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6985-9698</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib8" corresp="yes">
      <name name-style="western">
        <surname>Liu</surname>
        <given-names>Hongfang</given-names>
      </name>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>Department of Health Sciences Research</institution>
        <institution>Mayo College of Medicine</institution>
        <institution>Mayo Clinic</institution>
        <addr-line>200 First Street SW</addr-line>
        <addr-line>Rochester, MN, 55905</addr-line>
        <country>United States</country>
        <phone>1 5072930057</phone>
        <fax>1 5072841516</fax>
        <email>Liu.Hongfang@mayo.edu</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2570-3741</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>The Second Clinical College</institution>
    <institution>Guangzhou University of Chinese Medicine</institution>  
    <addr-line>Guangzhou</addr-line>
    <country>China</country></aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>Department of Health Sciences Research</institution>
    <institution>Mayo College of Medicine</institution>  
    <institution>Mayo Clinic</institution>  
    <addr-line>Rochester, MN</addr-line>
    <country>United States</country></aff>
    <aff id="aff3">
    <sup>3</sup>
    <institution>Department of Traditional Chinese Medicine</institution>
    <institution>The Seventh Affiliated Hospital of Sun Yat-sen University</institution>  
    <addr-line>Shenzhen</addr-line>
    <country>China</country></aff>
    <aff id="aff4">
    <sup>4</sup>
    <institution>Department of Computer Science and Engineering</institution>
    <institution>University at Buffalo, The State University of New York</institution>  
    <addr-line>Buffalo, NY</addr-line>
    <country>United States</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Hongfang Liu 
      <email>Liu.Hongfang@mayo.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><month>10</month><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>16</day>
      <month>10</month>
      <year>2017</year>
    </pub-date>
    <volume>19</volume>
    <issue>10</issue>
    <elocation-id>e342</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>24</day>
        <month>3</month>
        <year>2017</year>
      </date>
      <date date-type="rev-request">
        <day>15</day>
        <month>6</month>
        <year>2017</year>
      </date>
      <date date-type="rev-recd">
        <day>6</day>
        <month>8</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>29</day>
        <month>8</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Yuqun Zeng, Xusheng Liu, Yanshan Wang, Feichen Shen, Sijia Liu, Majid Rastegar Mojarad, Liwei Wang, Hongfang Liu. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 16.10.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2017/10/e342/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Self-management is crucial to diabetes care and providing expert-vetted content for answering patients’ questions is crucial in facilitating patient self-management.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>The aim is to investigate the use of information retrieval techniques in recommending patient education materials for diabetic questions of patients.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>We compared two retrieval algorithms, one based on Latent Dirichlet Allocation topic modeling (topic modeling-based model) and one based on semantic group (semantic group-based model), with the baseline retrieval models, vector space model (VSM), in recommending diabetic patient education materials to diabetic questions posted on the TuDiabetes forum. The evaluation was based on a gold standard dataset consisting of 50 randomly selected diabetic questions where the relevancy of diabetic education materials to the questions was manually assigned by two experts. The performance was assessed using precision of top-ranked documents.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>We retrieved 7510 diabetic questions on the forum and 144 diabetic patient educational materials from the patient education database at Mayo Clinic. The mapping rate of words in each corpus mapped to the Unified Medical Language System (UMLS) was significantly different (<italic>P</italic>&#60;.001). The topic modeling-based model outperformed the other retrieval algorithms. For example, for the top-retrieved document, the precision of the topic modeling-based, semantic group-based, and VSM models was 67.0%, 62.8%, and 54.3%, respectively.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>This study demonstrated that topic modeling can mitigate the vocabulary difference and it achieved the best performance in recommending education materials for answering patients’ questions. One direction for future work is to assess the generalizability of our findings and to extend our study to other disease areas, other patient education material resources, and online forums.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>education materials</kwd>
      <kwd>patients</kwd>
      <kwd>questions</kwd>
      <kwd>recommendation</kwd>
      <kwd>information retrieval</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diabetes is a chronic metabolic disease currently affecting almost 415 million patients worldwide with an estimation of this reaching 642 million by the year 2040 [<xref ref-type="bibr" rid="ref1">1</xref>]. Having diabetes is associated with substantially higher lifetime medical expenditures despite being associated with reduced life expectancy [<xref ref-type="bibr" rid="ref2">2</xref>]. Optimal control of diabetes requires a high degree of self-management where individuals have the necessary knowledge, skill, and ability for diabetes self-care [<xref ref-type="bibr" rid="ref3">3</xref>]. Self-management consists of a complex and dynamic set of processes and is deeply embedded in each patient’s unique situation [<xref ref-type="bibr" rid="ref4">4</xref>]. Meeting the information needs of each patient is crucial in facilitating self-management.</p>
      <p>Patients’ self-learning is an important component of self-management. For example, through self-learning modules, patients can gain more knowledge and be more knowledgeable about practice interventions regarding foot care, which is a widely neglected part of diabetes management [<xref ref-type="bibr" rid="ref5">5</xref>]. Meanwhile, the Internet has become an important source of self-learning for patients. Many online health communities and forums have emerged as popular platforms for patients to ask questions and share information. However, the quality of health information on the Internet is highly variable [<xref ref-type="bibr" rid="ref6">6</xref>]. It is crucial to provide expert-vetted information to patients. At the same time, there is an abundant supply of expert-vetted patient education resources that aim to help diabetic patients improve their diabetes self-management [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]; however, it is quite challenging for patients without a medical background to find relevant educational materials. A system that can automatically recommend such resources to patients based on their questions in an online forum would be one way to provide relevant expert-vetted education materials.</p>
      <p>Retrieving relevant education materials for given questions can be regarded as an information retrieval task. Information retrieval refers to the task of retrieving information of any type from a collection of documents related to search queries. One classic information retrieval approach is based on keyword matching (ie, Boolean model) [<xref ref-type="bibr" rid="ref10">10</xref>], where documents are represented as a set of terms and queries are represented as Boolean expressions. Another popular information retrieval approach is the ranking model. Unlike the Boolean model where terms are equally weighted, the ranking model ranks the result list in terms of relevance of documents with respect to an information need expressed in the query [<xref ref-type="bibr" rid="ref10">10</xref>]. Ranking is usually to compute numeric scores of query/document pairs where numerous scoring algorithms have been used. For example, the vector space model (VSM) computes the similarity between a query vector and a document vector, where terms can be weighted using a term frequency-inverse document frequency (TF-IDF) model [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. One common idea of information seeking is to come up with good queries by thinking of words that would likely appear in a relevant document. The language models directly model such ideas where a document is a good match to a query if the document is likely to generate such a query. For a query, the probabilistic language model approach computes a probabilistic language model and ranks documents based on the probability of the model generating the query. Semantic searching intends to improve searches by understanding the semantics in queries and document collections. Concept mapping is popularly used in semantic searches where keywords are mapped to concepts captured in terminological resources. In general English, WordNet is a popular terminology resource where terms are grouped into sets of synonyms according to their meanings and organized into hierarchies based on their semantic relations [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>Recently, topic modeling, which discovers abstract topics in document collections, has become a frequently used technique in text mining. The most common topic modeling approach is Latent Dirichlet Allocation (LDA), which allows documents to have a mixture of topics. For example, Wang and Blei [<xref ref-type="bibr" rid="ref14">14</xref>] used topic modeling to generate an interpretable latent structure for users and items, which can provide recommendations about both existing and newly published scientific articles. In information retrieval, topic modeling can be effective in enabling the incorporation of hidden semantics [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>In the clinical domain, there are many information retrieval applications [<xref ref-type="bibr" rid="ref16">16</xref>], including clinical decision support. For example, InfoRetriever was designed for family medicine providers to practice evidence-based medicine [<xref ref-type="bibr" rid="ref17">17</xref>]. Information retrieval technology is also popularly used in patient education applications, such as the PERSIVAL system, which is based on individual patient records and provides personalized access to a distributed patient care digital library by retrieving and summarizing relevant education materials.</p>
      <p>Here, we propose a system that leverages the latest information retrieval techniques, which recommends patient education materials for questions asked by patients online. The system aims to provide expert-vetted, patient-faced information to patients. A similar system has been proposed by Kandula et al [<xref ref-type="bibr" rid="ref18">18</xref>] where, instead of patients questions, their system recommended relevant education materials based on medical records. In this study, we investigated the use of state-of-the-art information retrieval approaches to recommend diabetes education materials for questions available in an online diabetes forum.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>An overview of our workflow of this study is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>. We designed a recommendation system using three retrieval models, including a topic modeling-based model, a semantic group-based model, and a VSM. To evaluate the performance of each model in the system, we assembled a gold standard dataset created manually for a randomly sampled subset of questions.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>The workflow of this study.</p>
        </caption>
        <graphic xlink:href="jmir_v19i10e342_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <sec>
        <title>Materials</title>
        <p>The materials used for our study included a corpus of patient educational materials for diabetic patients retrieved from Mayo Clinic’s patient education database and a corpus of questions retrieved from a diabetic forum. There were more than 7400 high-quality, expert-reviewed, and outcome-based patient education materials available in the Mayo Clinic’s Database of Approved Patient Education Materials, which are indexed using disease concepts. We retrieved all diabetes-related education materials, a total of 144 documents, in PDF format and used Apache Tika, a content analysis toolkit [<xref ref-type="bibr" rid="ref19">19</xref>], to transform the PDF format to plain text and form the patient educational materials corpus. We chose a popular diabetic online forum, the TuDiabetes forum [<xref ref-type="bibr" rid="ref20">20</xref>], to retrieve questions asked by diabetic patients. There are more than 43,000 forum users who post questions, provide answers or comments, participate in discussions, and share experiences. Questions in the forum have been categorized into 12 categories. We gathered a total of 7510 diabetic questions from the website; for each question, the corresponding title, content, and category were extracted and formed into the corpus of questions from diabetic patients.</p>
      </sec>
      <sec>
        <title>Tools</title>
        <p>We used the Unified Medical Language System (UMLS) from the US National Library of Medicine (NLM) and the associated concept-mapping tool, MetaMap, to represent and extract clinical concepts from the corpora. The UMLS is a comprehensive resource for clinical concepts, which integrates more than 2 million names for some 900,000 concepts from more than 60 families of biomedical vocabularies, as well as 12 million relations among these concepts [<xref ref-type="bibr" rid="ref21">21</xref>]. Each clinical concept is assigned a concept unique identifier. The UMLS arranges clinical concepts into 134 semantic types. These semantic types are further grouped into 15 semantic groups. The MetaMap tool is a configurable app developed by NLM to map biomedical text to the UMLS Metathesaurus.</p>
        <p>We used the LDA topic model with JGibbLDA software [<xref ref-type="bibr" rid="ref22">22</xref>] to classify the patient education materials. LDA topic modeling is a common method that generates a high underlying set of topic probabilities with an infinite mixture based on a three-level hierarchical Bayesian model [<xref ref-type="bibr" rid="ref23">23</xref>]. The statistical analysis was performed using R [<xref ref-type="bibr" rid="ref24">24</xref>]. The attribute proportion data were analyzed using chi-square tests. We also used Cytoscape software version 3.4 to visualize the networks generated in different models [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      </sec>
      <sec>
        <title>Information Retrieval Algorithms</title>
        <p>We compared three algorithms for recommending patient education materials for matching questions: (1) a VSM model as the baseline model using scikit-learn 0.18.0 package [<xref ref-type="bibr" rid="ref26">26</xref>], (2) a topic modeling-based matching model motivated by Kandula et al [<xref ref-type="bibr" rid="ref18">18</xref>] using topic modeling for matching patient educational material to patient’s clinic notes, and (3) a semantic group-based matching model that considered each semantic group as a topic in the patient educational materials corpus, the detail processing in <xref ref-type="fig" rid="figure2">Figure 2</xref>. See <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for the weight calculations for the topic modeling-based and semantic group-based models.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The workflow of the semantic group-based model. CHEM: chemicals and drugs; CONC: concepts and ideas; CUI: concept unique identifier; DISO: disease; QDP: questions from diabetic patients; PEM: patient educational materials.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Gold Standard and Evaluation</title>
        <p>To compare the performance, we randomly selected 50 questions and assembled a gold standard dataset based on manual review with the agreement of two experts. Specifically, for the pairing of question <italic>q</italic> and education material document <italic>d</italic>, we manually assigned a score in the range of 0 to 2 to indicate if d was relevant to q, where 0 indicated no relevance, 1 partial relevance, and 2 most relevance. Two medical experts performed the task. The weighted Cohen kappa value was calculated to determine interannotator agreement. A gold standard was then created based on the consensus of the two experts. The precision of the top <italic>k</italic> retrieved documents was used to evaluate the performance of the models, defined in the following:</p>
        <disp-formula>Precision (k)=(number of relevant documents)/k</disp-formula>
        <p>where a partial relevance document was counted as 0.5.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overall Statistics</title>
        <p>As shown in <xref ref-type="table" rid="table1">Table 1</xref>, the mean document length (word count) was 968 (SD 115) and 110 (SD 36) for patient educational materials and questions from diabetic patients, respectively. The UMLS mapping rate (the ratio of words that can be mapped to UMLS concepts) for patient educational materials was significantly higher than questions from diabetic patients (<italic>P</italic>&#60;.001) with more unique concepts in questions from diabetic patients than in patient educational materials. The unique word count in questions from diabetic patients was 41,820 with 8952 in patient educational materials. The majority of the words in patient educational materials were present in questions from diabetic patients with 25.06% (2244/8952) of the words not in questions from diabetic patients (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>An overview of the two corpora.</p>
          </caption>
          <table width="520" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="75"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Corpus</td>
                <td>Number</td>
                <td>Total word count <break/>(mapping rate)<sup>a</sup></td>
                <td>Word count, mean (SD)</td>
                <td>Unique word count</td>
                <td>Unique UMLS<break/>concepts, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Questions from diabetic <break/>patients</td>
                <td>7510</td>
                <td>829,893 (91.18%)</td>
                <td>110 (36)</td>
                <td>41,820</td>
                <td>19,616</td>
              </tr>
              <tr valign="top">
                <td>Patient educational materials</td>
                <td>144</td>
                <td>139,463 (93.31%)</td>
                <td>968 (115)</td>
                <td>8952</td>
                <td>7924</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup> Mapping rate was presented the probability of words mapped to the UMLS from the total word count. Difference in mapping rate between the two corpa was statistically significant (<italic>P</italic>&#60;.001).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the top 20 words for each corpus. The diabetes technology, community, and type 1 and latent autoimmune diabetes of adulthood (LADA) were the most common topics posted by questions from diabetic patient users, and topic 5, topic 3, and topic 8 were the main topics by topic modeling in patient educational materials documents as shown in <xref ref-type="table" rid="table3">Table 3</xref>. <xref ref-type="table" rid="table4">Table 4</xref> shows some examples of topics obtained using topic modeling, which lists the top 20 words and their corresponding weights for each of the topics. The results of the topic vocabulary similarity analysis calculating the cosine similarity between each two topics of the two corpora are presented by a heat map graphic (<xref ref-type="fig" rid="figure4">Figure 4</xref>). There was no vocabulary similarity between the questions from diabetic patients categories and the patient educational materials topics, but one topic to one another topic in interior questions from diabetic patients corpus had high linguistic similarity. The semantic group distribution of the two corpora was significantly different (<xref ref-type="fig" rid="figure5">Figure 5</xref>) where procedures, phenomena, objects, living beings, disorders, and anatomy were more prevalent in patient educational materials, whereas physiology, genes and molecular sequences, devices, and chemicals and drugs were more prevalent in patient educational materials.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The Venn diagram of the words in the two corpora. There were 35,112 (83.96%) unique words in the questions from diabetic patients (QDP) corpus and 2244 (25.06%) unique words in the patient educational materials (PEM) corpus.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The top 20 words in the two corpora.</p>
          </caption>
          <table width="475" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="75"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Rank</td>
                <td colspan="2">Questions from diabetic patients</td>
                <td colspan="2">Patient educational materials</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Word</td>
                <td>Frequency</td>
                <td>Word</td>
                <td>Frequency</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Diabetes</td>
                <td>9062</td>
                <td>Blood</td>
                <td>3081</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Insulin</td>
                <td>5369</td>
                <td>Insulin</td>
                <td>2504</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Type</td>
                <td>4657</td>
                <td>Glucose</td>
                <td>2074</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Like</td>
                <td>4620</td>
                <td>Diabetes</td>
                <td>1385</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Get</td>
                <td>4457</td>
                <td>Child</td>
                <td>1166</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Time</td>
                <td>4107</td>
                <td>Meal</td>
                <td>1047</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Know</td>
                <td>3875</td>
                <td>Childs</td>
                <td>815</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Pump</td>
                <td>3428</td>
                <td>Care</td>
                <td>801</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Now</td>
                <td>3421</td>
                <td>Health</td>
                <td>797</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Blood</td>
                <td>3388</td>
                <td>Dose</td>
                <td>782</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Day</td>
                <td>3317</td>
                <td>Test</td>
                <td>738</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>People</td>
                <td>2789</td>
                <td>Sugar</td>
                <td>728</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>First</td>
                <td>2395</td>
                <td>Help</td>
                <td>671</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>Sugar</td>
                <td>2383</td>
                <td>Provider</td>
                <td>638</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>Go</td>
                <td>2309</td>
                <td>Day</td>
                <td>635</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>Back</td>
                <td>2290</td>
                <td>High</td>
                <td>627</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>See</td>
                <td>2219</td>
                <td>Evening</td>
                <td>583</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Think</td>
                <td>2148</td>
                <td>Take</td>
                <td>583</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>High</td>
                <td>2088</td>
                <td>Time</td>
                <td>571</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>Use</td>
                <td>2036</td>
                <td>Eat</td>
                <td>547</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Category and topic distribution of the two corpora.</p>
          </caption>
          <table width="487" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="15"/>
            <col width="324"/>
            <col width="118"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Category/topic<sup>a</sup></td>
                <td>n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2"><bold>Questions from diabetic patients</bold></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Type 2</td>
                <td>454 (6.0)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Type 1 and LADA</td>
                <td>1609 (21.4)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>TuDiabetes website</td>
                <td>97 (1.3)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Treatment</td>
                <td>507 (6.8)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Mental and emotional wellness</td>
                <td>92 (1.2)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Healthy living</td>
                <td>187 (2.5)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Food</td>
                <td>321 (4.3)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Diabetes technology</td>
                <td>1903 (25.4)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Diabetes complications and other conditions</td>
                <td>211 (2.8)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Diabetes and pregnancy</td>
                <td>117 (1.6)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Diabetes advocacy</td>
                <td>253 (3.4)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Community</td>
                <td>1759 (23.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Patient educational materials (PEM)</bold></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM1</td>
                <td>6 (4.2)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM2</td>
                <td>5 (3.5)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM3</td>
                <td>13 (9.0)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM4</td>
                <td>6 (4.2)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM5</td>
                <td>15 (10.4)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM6</td>
                <td>10 (6.9)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM7</td>
                <td>3 (2.1)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM8</td>
                <td>11 (7.6)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM9</td>
                <td>5 (3.5)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM10</td>
                <td>7 (4.9)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM11</td>
                <td>9 (6.3)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM12</td>
                <td>9 (6.3)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM13</td>
                <td>6 (4.2)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM14</td>
                <td>8 (5.6)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM15</td>
                <td>3(2.1)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM16</td>
                <td>3(2.1)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM17</td>
                <td>6(4.2)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM18</td>
                <td>7(4.9)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM19</td>
                <td>5(3.5)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>PEM20</td>
                <td>7(4.9)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup> The categories of the questions from diabetic patients corpus were labeled as the website provided, and the topics of the patient educational material (PEM) corpus were generated using LDA topic modeling. The topic proportion was calculated with the maximum distribution of document.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Sample topics in the patient educational materials (PEM) corpus.</p>
          </caption>
          <table width="500" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="45"/>
            <col width="350"/>
            <col width="75"/>
            <thead>
              <tr valign="top">
                <td>PEM group</td>
                <td>Top 20 most prominent words (corresponding weight)</td>
                <td>Topic</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>PEM2</td>
                <td>Disease (0.071), kidney (0.043), risk (0.037), heart (0.031), health (0.023), pressure (0.021), care (0.018), provider (0.017), factors (0.017), people (0.017), kidneys (0.015), cholesterol (0.012), high (0.011), lifestyle (0.010), levels (0.010), protein (0.010), control (0.009), body (0.008), urine (0.008), medications (0.008)</td>
                <td>Complication-kidney</td>
              </tr>
              <tr valign="top">
                <td>PEM8</td>
                <td>Food (0.039), fruit (0.024), cup (0.022), foods (0.022), eat (0.020), sugar (0.020), fat (0.019), carbohydrate (0.017), meal (0.016), plan (0.015), milk (0.015), protein (0.014), carbohydrates(0.013), snack (0.013), vegetables (0.013), grams(0.011), meals (0.011), make (0.011), calories (0.010), serving (0.010)</td>
                <td>Food</td>
              </tr>
              <tr valign="top">
                <td>PEM13</td>
                <td>Care (0.024), feet (0.023), problems (0.022), provider (0.020), pain (0.020), health (0.017), term (0.017), symptoms (0.015), peripheral (0.015), website (0.014)nerves (0.013), legs (0.012), system (0.012), neuropathy (0.012), stroke (0.012), walking (0.011), figure (0.011), shoes (0.011), infections (0.009), brain (0.009)</td>
                <td>Complication-foot</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Heat map of questions from diabetic patients categories and patient educational materials topics based on cosine similarity of word vectors weighted using TF-IDF or topic word distribution. The clustering is based on Euclidean distance.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig4.jpeg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Distribution of 10 clinical semantic groups in the two corpora: questions from diabetic patients (QDP) and patient educational materials (PEM). ANAT: anatomy; CHEM: chemicals and drugs; DEVI: devices; DISO: disorders; GENE: genes and molecular sequences; LIVB: living beings; OBJC: objects; PHEN: phenomena; PHYS: physiology; PROC: procedures.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig5.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Network Analysis</title>
        <p><xref ref-type="fig" rid="figure6">Figure 6</xref> shows the networks of topics or semantic groups with questions for those with the topic/semantic group frequency larger than one (ie, question 5220 matched to topic 8 with a topic frequency of 2.22, and question 4124 matched to the physiology semantic group with semantic group frequency of 4.02). In the network of topic modeling-based model (<xref ref-type="fig" rid="figure6">Figure 6</xref>), all patient educational materials topics were presented, there were more questions matched to topic 4, topic 8, and topic 9, whereas some topics (eg, topic 1, topic 2, topic 3, or topic 10) were relevant to a small number of questions. Some questions were associated with very specific topics. For example, question 6722 from the diabetes complication and other condition topic in questions from diabetic patients corpus, the content of the question was: “Do you have neuropathy? Introduce yourself here! Foot pain, numbness, nerve pain, does anyone else know what I’m going through? Yes, we do!” It had the unique matching to the PEM13 topic (ie, complication-foot topic). In the network of semantic group-based model (<xref ref-type="fig" rid="figure6">Figure 6</xref>), the objects, physiology, and live beings groups had more questions. Similarly, some questions were associated with very specific semantic groups. For example, question 7113 from the diabetes technology topic in the questions from diabetic patients corpus, the content of the question was: “Are you an Accu-Chek user? Jump in here For users of ACCU-CHEK glucose meters.” It was mapped to the devices semantic group. The combination of the two networks (<xref ref-type="fig" rid="figure6">Figure 6</xref>) showed that for some questions the two models, topic modeling-based and semantic group-based, were complementary to each other. For example, question 2760 belonged to the diabetes complication and other condition topic in the questions from diabetic patients corpus, the content of the question was: “Balance neuropathy I don’t have the tingling, numbness, painful neuropathy, but the feelings I have in my feet somehow aren’t being delivered to my balance center. I am having a nerve conduction test an electromyography. Any advice?” It is relevant to the complication-foot topic (ie, PEM13) and also to the disorders semantic group.</p>
      </sec>
      <sec>
        <title>Performance Comparison</title>
        <p>The two experts had a high level of agreement in relevance judgment (κ=0.90). The performance of the three models is presented in <xref ref-type="fig" rid="figure7">Figure 7</xref> and <xref ref-type="table" rid="table5">Table 5</xref>. The topic modeling-based model outperformed the other two models at each rank, and the semantic group-based model had a better performance than the baseline VSM model. For example, for the top-retrieved document, the precision of the topic modeling-based, semantic group-based, and VSM models were 0.670 (67.0%), 0.628 (62.8%), and 0.543 (54.3%), respectively.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>(A) Network formed using the topic modeling-based model (TMB) with topic frequency cutoff 1, (B) network formed based on the semantic group-based model (SGB) with semantic group frequency cutoff 1, and (C) a combined network by linking the two networks (TMB+SGB) based on questions.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig6.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Performance comparison of topic modeling-based, semantic group-based, and vector space model (VSM) models.</p>
          </caption>
          <table width="648" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="125"/>
            <col width="58"/>
            <col width="58"/>
            <col width="58"/>
            <col width="58"/>
            <col width="64"/>
            <col width="52"/>
            <col width="61"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td colspan="7">Mean precision</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>P 1</td>
                <td>P 2</td>
                <td>P 3</td>
                <td>P 4</td>
                <td>P 5</td>
                <td>P 10</td>
                <td>P 20</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Topic modeling-based</td>
                <td>0.670</td>
                <td>0.622</td>
                <td>0.596</td>
                <td>0.588</td>
                <td>0.596</td>
                <td>0.579</td>
                <td>0.572</td>
              </tr>
              <tr valign="top">
                <td>Semantic group-based</td>
                <td>0.628</td>
                <td>0.606</td>
                <td>0.585</td>
                <td>0.582</td>
                <td>0.581</td>
                <td>0.564</td>
                <td>0.547</td>
              </tr>
              <tr valign="top">
                <td>VSM</td>
                <td>0.543</td>
                <td>0.532</td>
                <td>0.532</td>
                <td>0.529</td>
                <td>0.528</td>
                <td>0.528</td>
                <td>0.531</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Precision at rank 1 to 20 for topic modeling-based (TMB), semantic group-based (SGB), and vector space model (VSM) models.</p>
          </caption>
          <graphic xlink:href="jmir_v19i10e342_fig7.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>In summary, we investigated the use of the state-of-the-art information retrieval approaches to recommend diabetes education materials for questions available in an online forum for diabetes by leveraging a corpus assembled from diabetes education materials and a corpus assembled from an online forum. Our study shows that the language used in patient education materials is different from the language used in questions from an online forum. A topic modeling-based model has the potential to accurately recommend patient education material to a given question. Both topic modeling-based and semantic group-based models outperform the baseline VSM model. Network analysis illustrates that the network formed by topic modeling and the network formed by semantic groups are different and the combination of them may yield a better strategy.</p>
      <p>Literature has shown that the language used by patients is different from the one used by clinicians [<xref ref-type="bibr" rid="ref27">27</xref>]. Our study demonstrated that there is a language difference between patient education materials and questions in an online forum even though the target audiences of patient education materials are the patients. Patient educational materials are often produced internally by hospital staff without sufficient consideration of the patients intended to use them [<xref ref-type="bibr" rid="ref28">28</xref>]. In our study, patient education materials tend to cover clinical and patient life topics, whereas patients tend to ask about disease-specific technology and treatment from the top words in <xref ref-type="table" rid="table2">Table 2</xref>. In addition, the semantic group of questions from diabetic patients corpus included mainly chemical drugs, physiology, devices, and gene aspects more than patient educational materials corpus, and these semantic groups also related to complication, treatment, and technology categories. There was consistency between the primary category distribution of questions from diabetic patients and their semantic groups. Therefore, analyzing online forums can identify information needs of patients and provide an opportunity to create patient-centric education materials.</p>
      <p>The study demonstrated that topic modeling can mitigate the vocabulary difference between two corpora and achieve the best performance in recommending education materials to questions. In <xref ref-type="fig" rid="figure7">Figure 7</xref>, we found that the topic modeling-based model outperformed the other two models. Through topic modeling, topics and their probability distribution can be calculated for analyzing document similarity, which has been explored for document classification and personalized recommendation. For example, the iDoctor used LDA topic modeling for personalized and professionalized medical recommendation based on data available at crowd-sourced review websites [<xref ref-type="bibr" rid="ref29">29</xref>] and Kandula et al’s [<xref ref-type="bibr" rid="ref18">18</xref>] study also showed that the LDA topic modeling can better recommend patient education material to diabetic patients based on clinical notes. Our network analysis demonstrates that the topic modeling-based and semantic group-based models form two independent networks, which may imply that combining the two automated models has the potential to improve the recommendation.</p>
      <p>Here, we only studied one disease and used our institutional patient education materials. More research is needed to see if our findings can be generalized. One direction for future work is to extend our study to other disease areas, other patient education material resources, and online forums.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Information retrieval algorithms.</p>
        <media xlink:href="jmir_v19i10e342_app1.pdf" xlink:title="PDF File (Adobe PDF File), 128KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LADA</term>
          <def>
            <p>latent autoimmune diabetes of adulthood</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LDA</term>
          <def>
            <p>Latent Dirichlet Allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">VSM</term>
          <def>
            <p>vector space model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The study was supported by National Institute of Health research grants, R01LM011934-01A1 and R01EB019403 and grant NO.2014B010118005 from Guangdong Provincial Department of Science and Technology, Guangzhou, Guangdong, China. The first author was funded by China Scholarship Council.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
        <source>IDF Diabetes Atlas</source>  
        <access-date>2017-09-27</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.diabetesatlas.org/">http://www.diabetesatlas.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6tnpY8Vwj"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhuo</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Barker</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Albright</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Thompson</surname>
            <given-names>TJ</given-names>
          </name>
          <name name-style="western">
            <surname>Gregg</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>The lifetime cost of diabetes and its implications for diabetes prevention</article-title>
        <source>Diabetes Care</source>  
        <year>2014</year>  
        <month>09</month>  
        <volume>37</volume>  
        <issue>9</issue>  
        <fpage>2557</fpage>  
        <lpage>2564</lpage>  
        <pub-id pub-id-type="doi">10.2337/dc13-2484</pub-id>
        <pub-id pub-id-type="medline">25147254</pub-id>
        <pub-id pub-id-type="pii">dc13-2484</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Heinrich</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Schaper</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>de Vries</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Self-management interventions for type 2 diabetes: a systematic review</article-title>
        <source>Eur Diabetes Nurs</source>  
        <year>2015</year>  
        <month>02</month>  
        <day>17</day>  
        <volume>7</volume>  
        <issue>2</issue>  
        <fpage>71</fpage>  
        <lpage>76</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.tandfonline.com/doi/abs/10.1002/edn.160"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1002/edn.160</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Moser</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>van der Bruggen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Widdershoven</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Spreeuwenberg</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Self-management of type 2 diabetes mellitus: a qualitative investigation from the perspective of participants in a nurse-led, shared-care programme in the Netherlands</article-title>
        <source>BMC Public Health</source>  
        <year>2008</year>  
        <month>03</month>  
        <day>18</day>  
        <volume>8</volume>  
        <fpage>91</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/1471-2458-8-91"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2458-8-91</pub-id>
        <pub-id pub-id-type="medline">18366665</pub-id>
        <pub-id pub-id-type="pii">1471-2458-8-91</pub-id>
        <pub-id pub-id-type="pmcid">PMC2292711</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Devi</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Kapoor</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Effectiveness of self-learning module on the knowledge and practices regarding foot care among type II diabetes patients in East Delhi, India</article-title>
        <source>Int J Community Med Pub Health</source>  
        <year>2017</year>  
        <volume>3</volume>  
        <issue>8</issue>  
        <fpage>2133</fpage>  
        <lpage>2141</lpage>  
        <pub-id pub-id-type="doi">10.18203/2394-6040.ijcmph20162559</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kanthawala</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Vermeesch</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Given</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Huh</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Answers to health questions: Internet search results versus online health community responses</article-title>
        <source>J Med Internet Res</source>  
        <year>2016</year>  
        <month>04</month>  
        <day>28</day>  
        <volume>18</volume>  
        <issue>4</issue>  
        <fpage>e95</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2016/4/e95/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.5369</pub-id>
        <pub-id pub-id-type="medline">27125622</pub-id>
        <pub-id pub-id-type="pii">v18i4e95</pub-id>
        <pub-id pub-id-type="pmcid">PMC4865652</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Su</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>Q</given-names>
          </name>
        </person-group>
        <article-title>Development of a diabetes education program based on modified AADE diabetes education curriculum</article-title>
        <source>Int J Clin Exp Med</source>  
        <year>2014</year>  
        <volume>7</volume>  
        <issue>3</issue>  
        <fpage>758</fpage>  
        <lpage>763</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24753774"/>
        </comment>  
        <pub-id pub-id-type="medline">24753774</pub-id>
        <pub-id pub-id-type="pmcid">PMC3992419</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hermanns</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Kulzer</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Ehrmann</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Bergis-Jurgan</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Haak</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>The effect of a diabetes education programme (PRIMAS) for people with type 1 diabetes: results of a randomized trial</article-title>
        <source>Diabetes Res Clin Pract</source>  
        <year>2013</year>  
        <month>12</month>  
        <volume>102</volume>  
        <issue>3</issue>  
        <fpage>149</fpage>  
        <lpage>157</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.diabres.2013.10.009</pub-id>
        <pub-id pub-id-type="medline">24210673</pub-id>
        <pub-id pub-id-type="pii">S0168-8227(13)00351-3</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Haas</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Maryniuk</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Beck</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cox</surname>
            <given-names>CE</given-names>
          </name>
          <name name-style="western">
            <surname>Duker</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Edwards</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Fisher</surname>
            <given-names>EB</given-names>
          </name>
          <name name-style="western">
            <surname>Hanson</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Kent</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Kolb</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>McLaughlin</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Orzeck</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Piette</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Rhinehart</surname>
            <given-names>AS</given-names>
          </name>
          <name name-style="western">
            <surname>Rothman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Sklaroff</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Tomky</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Youssef</surname>
            <given-names>G</given-names>
          </name>
          <collab>2012 Standards Revision Task Force</collab>
        </person-group>
        <article-title>National standards for diabetes self-management education and support</article-title>
        <source>Diabetes Care</source>  
        <year>2014</year>  
        <month>01</month>  
        <volume>37 Suppl 1</volume>  
        <fpage>S144</fpage>  
        <lpage>S153</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24357210"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2337/dc14-S144</pub-id>
        <pub-id pub-id-type="medline">24357210</pub-id>
        <pub-id pub-id-type="pii">37/Supplement_1/S144</pub-id>
        <pub-id pub-id-type="pmcid">PMC4181074</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baeza-Yates</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Ribeiro-Neto</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <source>Modern Information Retrieval</source>  
        <year>1999</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>ACM Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Raghavan</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Wong</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>A critical analysis of vector space model for information retrieval</article-title>
        <source>J Am Soc Inform Sci</source>  
        <year>1986</year>  
        <volume>37</volume>  
        <issue>5</issue>  
        <fpage>279</fpage> </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salton</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>McGill</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Introduction to Modern Information Retrieval</source>  
        <year>1983</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>McGraw-Hill</publisher-name></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Miller</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>WordNet: a lexical database for English</article-title>
        <source>Commun ACM</source>  
        <year>1995</year>  
        <volume>38</volume>  
        <issue>11</issue>  
        <fpage>39</fpage>  
        <lpage>41</lpage>  
        <pub-id pub-id-type="doi">10.1145/219717.219748</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Blei</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Collaborative topic modeling for recommending scientific articles</article-title>
        <source>Proceedings of the 17th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>  
        <year>2011</year>  
        <month>08</month>  
        <conf-name>KDD '11 17th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
        <conf-date>Aug 21-24, 2011</conf-date>
        <conf-loc>San Diego, CA</conf-loc>
        <fpage>448</fpage>  
        <lpage>456</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://doi.org/10.1145/2020408.2020480"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yi</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Allan</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A comparative study of utilizing topic models for information retrieval</article-title>
        <source>ECIR 2009: Advances in Information Retrieval</source>  
        <year>2009</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>Springer</publisher-name>
        <fpage>29</fpage>  
        <lpage>41</lpage> </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gardner</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Information retrieval for patient care</article-title>
        <source>BMJ</source>  
        <year>1997</year>  
        <month>03</month>  
        <day>29</day>  
        <volume>314</volume>  
        <issue>7085</issue>  
        <fpage>950</fpage>  
        <lpage>950</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://doi.org/10.1136/bmj.314.7085.950"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmj.314.7085.950</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ebell</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Barry</surname>
            <given-names>HC</given-names>
          </name>
        </person-group>
        <article-title>InfoRetriever: rapid access to evidence-based information on a hand-held computer</article-title>
        <source>MD Comput</source>  
        <year>1998</year>  
        <volume>15</volume>  
        <issue>5</issue>  
        <fpage>289</fpage>  
        <lpage>297</lpage>  
        <pub-id pub-id-type="medline">9753974</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kandula</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Curtis</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Hill</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Zeng-Treitler</surname>
            <given-names>Q</given-names>
          </name>
        </person-group>
        <article-title>Use of topic modeling for recommending relevant education material to diabetic patients</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2011</year>  
        <volume>2011</volume>  
        <fpage>674</fpage>  
        <lpage>682</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22195123"/>
        </comment>  
        <pub-id pub-id-type="medline">22195123</pub-id>
        <pub-id pub-id-type="pmcid">PMC3243223</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
        <source>Apache Tika</source>  
        <access-date>2017-09-27</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://tika.apache.org/">https://tika.apache.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6tnsHd7mi"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
        <source>tudiabetes.org</source>  
        <access-date>2017-09-27</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.tudiabetes.org/forum/">http://www.tudiabetes.org/forum/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6tnsM3ZQi"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bodenreider</surname>
            <given-names>O</given-names>
          </name>
        </person-group>
        <article-title>The Unified Medical Language System (UMLS): integrating biomedical terminology</article-title>
        <source>Nucleic Acids Res</source>  
        <year>2004</year>  
        <month>01</month>  
        <day>1</day>  
        <volume>32</volume>  
        <issue>Database issue</issue>  
        <fpage>D267</fpage>  
        <lpage>D270</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://nar.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=14681409"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
        <pub-id pub-id-type="medline">14681409</pub-id>
        <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
        <pub-id pub-id-type="pmcid">PMC308795</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Phan</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Nguyen</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Horiguchi</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Learning to classify shortsparse text &#38;amp;amp; web with hidden topics from large-scale data collections</article-title>
        <source>Proceedings of the 17th International Conference on World Wide Web</source>  
        <year>2008</year>  
        <month>04</month>  
        <conf-name>WWW 2008 7th International Conference on World Wide Web</conf-name>
        <conf-date>Apr 21-25, 2008</conf-date>
        <conf-loc>Beijing, China</conf-loc>
        <fpage>91</fpage>  
        <lpage>100</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://doi.org/10.1145/1367497.1367510"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Blei</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Ng</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Jordan</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Latent Dirichlet Allocation</article-title>
        <source>J Mach Learn Res</source>  
        <year>2003</year>  
        <volume>3</volume>  
        <fpage>993</fpage>  
        <lpage>1022</lpage> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>R Core Team</collab>
        </person-group>
        <source>R Language Definition</source>  
        <year>2000</year>  
        <publisher-loc>Vienna, Austria</publisher-loc>
        <publisher-name>R foundation for statistical computing</publisher-name></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shannon</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Markiel</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ozier</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Baliga</surname>
            <given-names>NS</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>JT</given-names>
          </name>
          <name name-style="western">
            <surname>Ramage</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Amin</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Schwikowski</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Ideker</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Cytoscape: a software environment for integrated models of biomolecular interaction networks</article-title>
        <source>Genome Res</source>  
        <year>2003</year>  
        <month>11</month>  
        <volume>13</volume>  
        <issue>11</issue>  
        <fpage>2498</fpage>  
        <lpage>2504</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://genome.cshlp.org/cgi/pmidlookup?view=long&#38;pmid=14597658"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1101/gr.1239303</pub-id>
        <pub-id pub-id-type="medline">14597658</pub-id>
        <pub-id pub-id-type="pii">13/11/2498</pub-id>
        <pub-id pub-id-type="pmcid">PMC403769</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pedregosa</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Varoquaux</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Gramfort</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Michel</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Thirion</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Grisel</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Blondel</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Prettenhofer</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Dubourg</surname>
            <given-names>V</given-names>
          </name>
        </person-group>
        <article-title>Scikit-learn: machine learning in Python</article-title>
        <source>J Mach Learn Res</source>  
        <year>2011</year>  
        <volume>12</volume>  
        <fpage>2825</fpage>  
        <lpage>2830</lpage> </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Kogan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ash</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Greenes</surname>
            <given-names>RA</given-names>
          </name>
        </person-group>
        <article-title>Patient and clinician vocabulary: how different are they?</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2001</year>  
        <volume>84</volume>  
        <issue>Pt 1</issue>  
        <fpage>399</fpage>  
        <lpage>403</lpage>  
        <pub-id pub-id-type="medline">11604772</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Payne</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Large</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Jarrett</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Turner</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Written information given to patients and families by palliative care units: a national survey</article-title>
        <source>Lancet</source>  
        <year>2000</year>  
        <month>05</month>  
        <day>20</day>  
        <volume>355</volume>  
        <issue>9217</issue>  
        <fpage>1792</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://doi.org/10.1016/S0140-6736%2800%2902272-8"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/S0140-6736(00)02272-8</pub-id>
        <pub-id pub-id-type="medline">10832835</pub-id>
        <pub-id pub-id-type="pii">S0140-6736(00)02272-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>iDoctor: personalized and professionalized medical recommendations based on hybrid matrix factorization</article-title>
        <source>Future Gener Comp Sy</source>  
        <year>2017</year>  
        <month>01</month>  
        <volume>66</volume>  
        <fpage>30</fpage>  
        <lpage>35</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.future.2015.12.001"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.future.2015.12.001</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
