<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v19i4e130</article-id>
    <article-id pub-id-type="pmid">28438725</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.6834</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Analyzing and Predicting User Participations in Online Health Communities: A Social Support Perspective</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Eddens</surname>
          <given-names>Kate</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Alpert</surname>
          <given-names>Jordan</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1">
        <name name-style="western">
          <surname>Wang</surname>
          <given-names>Xi</given-names>
        </name>
        <degrees>MSc</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7568-0851</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2" corresp="yes">
      <name name-style="western">
        <surname>Zhao</surname>
        <given-names>Kang</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>Department of Management Sciences</institution>
        <institution>The University of Iowa</institution>
        <addr-line>S224 PBB</addr-line>
        <addr-line>Iowa City, IA, 52242</addr-line>
        <country>United States</country>
        <phone>1 3193353831</phone>
        <fax>1 3193350297</fax>
        <email>kang-zhao@uiowa.edu</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8321-2804</ext-link></contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Street</surname>
          <given-names>Nick</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1632-5905</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>Interdisciplinary Graduate Program in Informatics</institution>
    <institution>The University of Iowa</institution>  
    <addr-line>Iowa City, IA</addr-line>
    <country>United States</country></aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>Department of Management Sciences</institution>
    <institution>The University of Iowa</institution>  
    <addr-line>Iowa City, IA</addr-line>
    <country>United States</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Kang Zhao 
      <email>kang-zhao@uiowa.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><month>04</month><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>24</day>
      <month>04</month>
      <year>2017</year>
    </pub-date>
    <volume>19</volume>
    <issue>4</issue>
    <elocation-id>e130</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>17</day>
        <month>10</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>9</day>
        <month>11</month>
        <year>2016</year>
      </date>
      <date date-type="rev-recd">
        <day>28</day>
        <month>12</month>
        <year>2016</year>
      </date>
      <date date-type="accepted">
        <day>11</day>
        <month>2</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Xi Wang, Kang Zhao, Nick Street. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 24.04.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2017/4/e130/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Online health communities (OHCs) have become a major source of social support for people with health problems. Members of OHCs interact online with similar peers to seek, receive, and provide different types of social support, such as informational support, emotional support, and companionship. As active participations in an OHC are beneficial to both the OHC and its users, it is important to understand factors related to users’ participations and predict user churn for user retention efforts.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>This study aimed to analyze OHC users’ Web-based interactions, reveal which types of social support activities are related to users’ participation, and predict whether and when a user will churn from the OHC.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>We collected a large-scale dataset from a popular OHC for cancer survivors. We used text mining techniques to decide what kinds of social support each post contained. We illustrated how we built text classifiers for 5 different social support categories: seeking informational support (SIS), providing informational support (PIS), seeking emotional support (SES), providing emotional support (PES), and companionship (COM). We conducted survival analysis to identify types of social support related to users’ continued participation. Using supervised machine learning methods, we developed a predictive model for user churn.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>Users’ behaviors to PIS, SES, and COM had hazard ratios significantly lower than 1 (0.948, 0.972, and 0.919, respectively) and were indicative of continued participations in the OHC. The churn prediction model based on social support activities offers accurate predictions on whether and when a user will leave the OHC.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Detecting different types of social support activities via text mining contributes to better understanding and prediction of users’ participations in an OHC. The outcome of this study can help the management and design of a sustainable OHC via more proactive and effective user retention strategies.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>social support</kwd>
      <kwd>machine learning</kwd>
      <kwd>community networks</kwd>
      <kwd>patient engagement</kwd>
      <kwd>prediction</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Overview</title>
        <p>Nowadays more and more people use the Internet to satisfy their health-related needs. According to a study by the Pew Research Center, 80% of adult Internet users in the United States use the Internet for health-related purposes. Among them, 34% read health-related experiences or comments from others [<xref ref-type="bibr" rid="ref1">1</xref>]. Online health communities (OHCs) offer a venue for people to interact with peers facing similar health problems. Modern OHCs have incorporated many ways for communication and health management, such as listserv, discussion forums, private messaging, chat rooms, blogs, friend subscriptions, health tracking tools, and so on. OHCs range from general-purpose communities, such as MedHelp and PatientsLikeMe, to those dedicated to a specific health issue, such as diabetes and smoking. Many OHCs host their own websites, whereas some are built on existing social networking services, such as Facebook. Many studies have revealed the advantages and disadvantages of OHCs compared with traditional offline support groups [<xref ref-type="bibr" rid="ref2">2</xref>]. Although OHCs may face problems such as sporadic membership of active users, inaccurate information, deception, and insincerity of strangers [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>], they also offer tremendous benefits such as broad reach, availability, and anonymity. Consequently, OHCs have gained popularity in recent years, and it is estimated that 5% of all Internet users participated in an OHC [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>Studies of user behaviors in OHCs are valuable in several ways. First, outcomes of these studies can inform better management and design of a successful OHC, which can help to promote new treatments and healthy lifestyles and reveal adverse drug effects [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Like other online communities, successful OHCs would like to encourage users’ participations and prevent users’ churn (ie, leaving a community), because one of the keys for the success of an online community is active participations from and relationship building among its members [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. In contrast, poor participations and transient membership can lead to the termination or failure of an online community [<xref ref-type="bibr" rid="ref12">12</xref>]. Specifically, an OHC will not be sustainable if its users keep leaving because most of the social support can only be provided by active members of the OHC.</p>
        <p>Second, a successful and sustainable OHC will provide more benefits to individual users. This is because a user’s continued participation in an OHC can be helpful and therapeutic [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. On one hand, receiving such support can be empowering [<xref ref-type="bibr" rid="ref19">19</xref>] and help patients adjust to the stress of living with and fighting against their diseases [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. The support they receive online can also improve their offline life and health management [<xref ref-type="bibr" rid="ref22">22</xref>]. On the other hand, besides receiving support from others, staying in an OHC and providing support to others can be beneficial to providers as well [<xref ref-type="bibr" rid="ref20">20</xref>]. There is actually a positive relationship between posting frequency and psychosocial well-being [<xref ref-type="bibr" rid="ref23">23</xref>]. In other words, a user’s continued participation in an OHC can help herself or himself as well as others. Admittedly, for some individuals who have received satisfactory support from an OHC or recovered from the disease, leaving the OHC may not be a bad thing for themselves. However, even though user-generated information about a disease will still be available on the Internet to new OHC members, most of the psychosocial benefits for individual users cannot be achieved if the exodus of experienced users in the OHC keeps happening, leaving new members stranded [<xref ref-type="bibr" rid="ref23">23</xref>]. In fact, providing assistance for new members from experienced members and reminding members to participate continuously are also key factors for the success of online communities [<xref ref-type="bibr" rid="ref12">12</xref>]. 
Therefore, better understanding and accurate prediction of users’ participations in OHCs can help to build and sustain a successful OHC through improved community design, management, and user retention.</p>
        <p>As social support is a pillar of OHCs, a natural question to ask would be: when it comes to users’ participations, are a user’s Web-based activities in different types of social support related to her or his continued participation in an OHC? If so, can we predict whether and when a user will churn from an OHC based on these social support activities? Despite the large amount of research on social support in OHCs, few studies have answered this question systematically by examining users’ seeking, receiving, and provision of various types of social support from large-scale datasets. An explanatory model [<xref ref-type="bibr" rid="ref24">24</xref>] suggested that receiving more emotional support is associated with users’ longer stay in an OHC. However, the types of social support investigated were limited and only the receiving of support was considered, while we mentioned earlier that providing social support is also important and beneficial. Analyzing large-scale data from a real-world OHC with various data analytics techniques, including text mining, survival analysis, and predictive modeling, our research explained as well as predicted users’ continued participations in OHCs from the perspective of online social support.</p>
      </sec>
      <sec>
        <title>Background and Research Goals</title>
        <sec>
          <title>Social Support and OHCs</title>
          <p>According to Shumaker and Brownell [<xref ref-type="bibr" rid="ref25">25</xref>], social support refers to the “exchange of resources between at least two individuals perceived by the provider or the recipient to be intended to enhance the well-being of the recipient.” Based on the nature of exchanged “resources,” community psychology researchers have identified different types of social support [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. In this research, we adopted the four types of social support proposed in [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]: informational support, emotional support, companionship, and instrumental support. Informational support is the transmission of information, suggestion, or guidance to the community users [<xref ref-type="bibr" rid="ref30">30</xref>]. The content of such a post in an OHC is usually related to advice, referrals, education, and personal experience with the disease or health problem. Example topics include side effects of a drug, ways to deal with a symptom, experience with a physician, or medical insurance problems. Emotional support, as its name suggests, contains the expression of understanding, encouragement, empathy, affection, affirming, validation, sympathy, caring, and concern. Companionship, also known as network support, consists of chatting, humor, teasing, as well as discussions of offline activities and daily life that are not necessarily related to one’s health problems. Thus, they are sometimes referred to as “off-topic” discussions. Examples include sharing jokes, birthday wishes, holiday plans, or Web-based scrabble games. Instrumental support, or tangible support, refers to offline support activities in the physical world, such as transporting others to hospitals, assistance in grocery shopping, and so forth. 
Empirical studies suggested that informational support, emotional support, and companionship are common in many OHCs, but instrumental support is rare, as such support is limited by geographical proximity [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Also, the further exchange and arrangement of instrumental support may often occur via private or offline communication channels (eg, setting a time for grocery shopping via cell phones). To simplify our automated social support classification, we did not consider instrumental support in this study.</p>
          <p>The emergence of OHCs provides new opportunities to study social support at unprecedented scales and granularities. Traditional studies on offline support communities relied heavily on data collected through ethnographical observations, interviews, questionnaires, or surveys [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref36">36</xref>]. However, research using these data collection methods faces 3 challenges. First, the scale of the data is limited because observations and interviews are labor intensive and time consuming. Second, results may be biased due to the realities of sampling community members. For example, members who are active in or satisfied with their communities may be more likely to respond to questionnaires or surveys. Third, survey and interview methods typically have coarse temporal granularity and rely on members’ recall of past events and associated feelings. This makes it very difficult to accurately track community members’ activities during an extended time period.</p>
          <p>By contrast, OHCs not only enable but also record asynchronous and distributed social interactions among individuals, making the “big data” available for computational analysis. Such detailed data of users’ online interactions (eg, the amount, content, and time of interactions) contain valuable information on users’ behaviors. To study social support at such a large scale and fine granularity, we need to reveal the nature of social support embedded in users’ contributions in an automated way. Hence, our first research goal was about mining large-scale text data contributed by OHC users to detect different types of social support activities.</p>
          <disp-quote>
            <p>Goal #1: Detect the seeking and provision of different types of social support from unstructured text of large-scale distributed interactions among OHC users.</p>
          </disp-quote>
        </sec>
        <sec>
          <title>Online Community Participations</title>
          <p>According to Preece [<xref ref-type="bibr" rid="ref37">37</xref>], an online community is a group of people who are connected through the Internet and interact over time around a shared purpose, interest, or need. The success of online communities depends largely on sustained participations and voluntary contributions from users [<xref ref-type="bibr" rid="ref38">38</xref>]. Researchers have revealed factors related to user participation in online communities, such as open-source software development [<xref ref-type="bibr" rid="ref39">39</xref>], Wikipedia [<xref ref-type="bibr" rid="ref40">40</xref>], and Question &#38; Answering communities [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>].</p>
          <p>Different from other types of online communities, seeking and obtaining various types of social support is a key reason people participate in an OHC [<xref ref-type="bibr" rid="ref43">43</xref>]. On one hand, OHC users have a common identity as the patient of a disease, and information about the disease will be discussed and exchanged very often. On the other hand, the exchange of emotional support and participations in companionship, often in the form of seemingly off-topic discussions, can help OHC users get to know each other personally as they share things beyond health and the common disease. To understand which types of social support are more indicative of user engagement in the community, our second research goal was to run an explanatory model to connect different types of social support with users’ continued participation.</p>
          <disp-quote>
            <p>Goal #2: Develop an explanatory model to explore whether users’ activities in seeking, providing, and receiving different types of social support are related to their continued participations in an OHC.</p>
          </disp-quote>
        </sec>
        <sec>
          <title>Churn Predictions</title>
          <p>In addition to building an explanatory model to understand factors related to users’ continued participations, another key to sustain an online community is to predict user churn, so that the community can intervene when a user is about to churn and try to retain her or him. Implications for churn prediction are not limited to online communities but also extend to other online and offline businesses, such as telecommunication [<xref ref-type="bibr" rid="ref44">44</xref>], retail [<xref ref-type="bibr" rid="ref45">45</xref>], Internet access service [<xref ref-type="bibr" rid="ref46">46</xref>], and online gaming [<xref ref-type="bibr" rid="ref47">47</xref>]. These models have leveraged different types of data about customers and the market, including those related to money, contracts, demographics, usage, products, complaints, competitions, and social networks [<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref50">50</xref>].</p>
          <p>When it comes to online communities, traditional churn prediction faces challenges as well as opportunities. On one hand, many of the features commonly used for churn prediction in for-profit business are not available or make no sense. For instance, users’ demographic data (eg, residential address, income, and ethnicity) is usually unavailable or inaccurate in online communities. Also, because many online communities are based on voluntary participations and do not charge any fee, monetary and contractual issues become largely irrelevant. On the other hand, online communities provide more detailed data about users’ behaviors for predictive analytics [<xref ref-type="bibr" rid="ref51">51</xref>]. While previous churn prediction studies have leveraged structured data of users’ activities, few have examined the unstructured content of users’ interactions or contributions. In contrast, in many online communities, including OHCs, a large amount of such content is publicly available from the Web. Previous research on online social networks and social media has suggested that content analysis can be helpful in areas such as personalized recommendation [<xref ref-type="bibr" rid="ref52">52</xref>], community discovery [<xref ref-type="bibr" rid="ref53">53</xref>], and influential user identification [<xref ref-type="bibr" rid="ref54">54</xref>]. We believe analyzing unstructured text posted by online community users from a social support perspective should contribute to accurate churn prediction in OHCs.</p>
          <p>Moreover, many churn predictions for traditional business are limited to snapshot data—a model is learned from data for customers, who were active during a specific period (ie, the training period, usually a couple of months to half a year), based on which customers churned in the subsequent testing period (often a few months). For an online community, data for a user’s complete “life span” in the community can be available for analysis. Such complete data can provide valuable information because those who churn after the first week may behave differently from those who churn after a month. Thus, our last research goal is about building a predictive model using data of users’ social support activities.</p>
          <disp-quote>
            <p>Goal #3: Leverage data about users’ Web-based social support activities over time to build a predictive model to forecast whether and when a user will churn from an OHC.</p>
          </disp-quote>
        </sec>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>In this research, we used the data from a very popular peer-to-peer OHC (Breastcancer.org) among breast cancer survivors as a case study. We designed a Web crawler to collect data from its online forum. Our dataset consisted of all the public posts and basic user profile information from October 2002 to August 2013.</p>
      <sec>
        <title>Methods of Social Support Detection</title>
        <p>As we mentioned earlier, informational support, emotional support, and companionship are the three major types of social supports in OHCs. Thus for each post from an OHC, we need to determine whether it was seeking informational support (SIS), providing informational support (PIS), seeking emotional support (SES), providing emotional support (PES), or simply about companionship (COM). Note that we did not differentiate the seeking and provision of companionship because the nature of companionship was about participation and sharing. By getting involved in activities or discussions about companionship through posting, one was seeking and providing support at the same time. It was also possible that a post could belong to more than 1 of the aforementioned categories. <xref ref-type="table" rid="table1">Table 1</xref> lists example posts for each category and a post that belongs to 2 categories.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Example posts for different types of social support.</p>
          </caption>
          <table width="607" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="436"/>
            <thead>
              <tr valign="top">
                <td>Social support category</td>
                <td>Examples</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Companionship (COM)</td>
                <td>(1) <italic>Kelly Have a wonderful time in Florida, enjoy the sun and fun. Heather</italic> <break/>(2) <italic>I’m loving her new CD. Didn’t recognize any of the songs at first, but there are a few now that I find myself singing the rest of the day.</italic> <break/>(3) <italic>This game has the poster making a new 2 word phrase starting with the second word of the last post Example: Post : Hand out Next poster: Outcast Next poster: Cast Iron Next poster: Iron Age Now let’s begin the game~ Age Old</italic></td>
              </tr>
              <tr valign="top">
                <td>Seeking informational support (SIS)</td>
                <td><italic>Where do you buy digestive enzymes and what are they called?</italic></td>
              </tr>
              <tr valign="top">
                <td>Seeking emotional support (SES)</td>
                <td><italic>I feel like everyone else's lives are going forward, they have plans, hopes, aspirations because they feel. I am one of those not yet out of the woods. I was also someone who could never get cancer. I was a good person, exercised, ate well. Good people don't get sick. I have taken the step of antidepressants, they mitigate the damage, but do not block the pain or sadness I feel.</italic></td>
              </tr>
              <tr valign="top">
                <td>Providing informational support (PIS)</td>
                <td><italic>I had surgery Aug05 for bc recurrance. B4 surgery I had 33 IMRT rads, prior to that had 4A/C &#38; 4 Taxol. I had bc in 2000 &#38; had 37 rads in same general area. Now, my surgery won't heal. Wound doc says there is adema or something on my sternum (shown on recent MRI). My wound has been draining since it broke open in Sept.</italic></td>
              </tr>
              <tr valign="top">
                <td>Providing emotional support (PES)</td>
                <td><italic>Hope you feel better soon, we are here! Prayers Hugs come from Massachusetts APPLE♥</italic> <italic>.</italic></td>
              </tr>
              <tr valign="top">
                <td>Providing informational support (PIS) and providing emotional support (PES)</td>
                <td><italic>I am also the daughter of a 35 yrs BC survivor. Mom is just now going through some more Cancer - alas - they found it in her lung, but it is totally unlikely to be a follow-up of her old BC. I am 45, and was 43 at DX time, my mom was diagnosed at 38... and I am a BRCA2 carrier. Tina, one day at a time. Maybe you'll get good news - it is so hard to wait!!! It is also important to remember that - whatever it is, it is highly treatable, and that YOU WILL SURVIVE too!!! and life goes on after. It will take some time, but it goes on... see my picture? even the hair is back!!! Hugs to all. I am happy you all found your way here, it is a great site for exchanging information, learning and finding support.</italic></td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>Because it is practically impossible to label all 2.8 million posts manually, we used text classification algorithms to decide what kinds of social support each post contained. Text mining techniques have been adopted to analyze large-scale text data from online social networks, including texts from online health communities (similar findings by Ko D-G, Mai F, and Zhe S, unpublished data, 2015). To train a text classification algorithm, we leveraged human annotated data. We randomly selected 1333 posts out of our dataset. After being trained on the definitions and examples of the aforementioned 5 categories of social supports (SIS, PIS, SES, PES, and COM), 5 human annotators were asked to read each post and decide whether the post belongs to one or more categories of social support (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for the training instruction). To control the quality of human annotations, we also added to the pool 10 posts that had been annotated by domain experts. For each post, we only accepted results from annotators whose performance on the 10 quality-control posts was among the top 3. The results from the other 2 annotators were discarded. Then, a majority vote among the top 3 annotators was used to determine whether a post was related to a category of social support. <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> lists the outcome of the annotation.</p>
        <p>Users in OHCs may have different writing styles or linguistic preferences to express themselves. To capture these characteristics, we examined each post and extracted various types of features for training the classifier: basic features, lexical features, sentiment features, and topic features. <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref> includes more details about the feature engineering for social support classification.</p>
      </sec>
      <sec>
        <title>Methods of Participation Analysis</title>
        <p>After detecting the nature of social support in each post, we conducted survival analysis to study how different types of social support activities were related to users’ participations. An individual may enter or exit a community not only based on his or her own expectations and behaviors, but also based on the community’s reactions toward this individual [<xref ref-type="bibr" rid="ref55">55</xref>]. Thus, in addition to users’ own posting behaviors, we also examined whether receiving or being exposed to different types of social support would impact a user’s participation.</p>
        <p>Our survival analysis was based on the Cox proportional-hazards model [<xref ref-type="bibr" rid="ref56">56</xref>], which assessed the importance of different independent variables on the “survival time” it takes for a specific event to occur (<xref ref-type="app" rid="app3">Multimedia Appendix 3</xref> includes more details of the model setup). Specifically, for our analysis, an “event” referred to a user’s cessation of activities in the OHC (ie, churn from the OHC). A user’s survival time was measured from the difference between her last and first posts in the OHC. Similar to a previous study [<xref ref-type="bibr" rid="ref24">24</xref>], we assumed that a user had churned from this OHC if she had no post during the last 12 weeks in our dataset. For those who were active in the OHC during the last 12 weeks, their survival time was right-censored because they were still participating in this OHC.</p>
        <p><xref ref-type="table" rid="table2">Table 2</xref> summarizes independent variables in our model. They reflect users’ own posting behaviors in various social support categories, as well as the amount of social support they received in threaded discussions in direct or indirect ways. A user received support directly when she initiated a thread to seek support and got support from others’ replies to the thread. Meanwhile, social support could also be received indirectly when one replied to a thread started by another user because she might be exposed to support that other users provided to the original poster. In addition to these independent variables, we also included 3 control variables to reflect users’ overall levels of activities.</p>
        <p>The experiment included 19,165 users whose time spans of activities in the OHC exceeded 1 month. Values of control and independent variables were collected based on their behaviors in seeking, providing, and receiving social support in the first month of their participations. To reduce the impact of multi-collinearity, we calculated the correlation coefficients for every pair of variables. We then removed TotalPost and NumThread from the model, as both were strongly correlated with the other control variable InitPost (with correlation coefficients greater than .8). Thus, our model for survival analysis included 1 control variable and 10 independent variables.</p>
      </sec>
      <sec>
        <title>Methods of Churn Prediction</title>
        <p>If different types of social support activities are indeed related to users’ participations in OHCs, OHC managers can design more effective interventions to retain users. Such interventions can be more targeted when OHC managers know who is likely to leave and when. Therefore, this section proposes a model to predict whether and when a user will churn from an OHC and demonstrates the value of including social support activities over time in such predictions.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Control variables and independent variables in the survival analysis.</p>
          </caption>
          <table width="607" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="436"/>
            <thead>
              <tr valign="top">
                <td>Variables</td>
                <td>Descriptions</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>TotalPost<sup>a</sup></td>
                <td>The total number of posts a user has published (excluded from the model due to strong correlation with <italic>InitPost</italic>)</td>
              </tr>
              <tr valign="top">
                <td>InitPost<sup>a</sup></td>
                <td>The total number of threads a user initiated</td>
              </tr>
              <tr valign="top">
                <td>NumThread<sup>a</sup></td>
                <td>The number of threads a user contributed to (excluded from the model due to strong correlation with <italic>InitPost</italic>)</td>
              </tr>
              <tr valign="top">
                <td>PES<sup>b</sup></td>
                <td>The number of a user’s posts that provided emotional support</td>
              </tr>
              <tr valign="top">
                <td>PIS<sup>c</sup></td>
                <td>The number of a user’s posts that provided informational support</td>
              </tr>
              <tr valign="top">
                <td>SES<sup>d</sup></td>
                <td>The number of a user’s posts that sought emotional support</td>
              </tr>
              <tr valign="top">
                <td>SIS<sup>e</sup></td>
                <td>The number of a user’s posts that sought informational support</td>
              </tr>
              <tr valign="top">
                <td>COM<sup>f</sup></td>
                <td>The number of a user’s posts that were related to companionship</td>
              </tr>
              <tr valign="top">
                <td>RIS<sub>D</sub></td>
                <td>Direct informational support received—the number of informational support posts a user received after initiating a support-seeking thread.</td>
              </tr>
              <tr valign="top">
                <td>RES<sub>D</sub></td>
                <td>Direct emotional support received—the number of emotional support posts a user received after initiating a support-seeking thread.</td>
              </tr>
              <tr valign="top">
                <td>RIS<sub>I</sub><sup>g</sup></td>
                <td>Indirect informational support received—the number of informational support posts a user was exposed to in threads that she or he did not initiate but contributed to.</td>
              </tr>
              <tr valign="top">
                <td>RES<sub>I</sub><sup>g</sup></td>
                <td>Indirect emotional support received—the number of emotional support posts a user was exposed to in threads that she or he did not initiate but contributed to.</td>
              </tr>
              <tr valign="top">
                <td>RCOM<sup>g</sup></td>
                <td>Companionship received—the number of companionship posts a user was exposed to in threads that she or he did not initiate but contributed to.</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>denotes the three control variables.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>PES: providing emotional support.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>PIS: providing informational support.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>SES: seeking emotional support.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>SIS: seeking informational support.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>COM: companionship.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>For <italic>RIS</italic><sub>I</sub>, <italic>RES</italic><sub>I</sub>, and <italic>RCOM</italic>, we assumed that a user read others’ replies that were posted within 7 days before the user’s replies in the same thread.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Basic features for our predictive model are derived from the 13 variables (3 control variables and 10 independent variables) defined for survival analysis (<xref ref-type="table" rid="table2">Table 2</xref>). Because these features aggregated users’ activities during the training period, we also measured how users’ values on the 13 features varied over time using 4 types of temporal features. Specifically, for each user, we divided her activities measured by each of the 13 basic features into weeks and used 4 additional metrics to capture how the value of each feature changes over the weeks, including overall slope, Shannon entropy, stability, and temporal variations (TV) as proposed in [<xref ref-type="bibr" rid="ref57">57</xref>]. In addition to cumulative values for each basic feature during the training period, we also conjectured that a user’s intention to churn might be better captured during the last week of her online activities. Thus, we also included values for basic features during the last week of the training period if the training period was longer than 1 week. Each basic feature for the last week also had 4 corresponding features to reflect its temporal patterns (ie, slope, Shannon entropy, stability, and TV), although the unit of time was day instead of week. We also added into the feature set the time difference between a user’s registration time and the time of her first post because it might reveal what brought the user to the OHC for the first time. A user who is eager to find some information might have a low gap between the registration time and the time of first posting. More details of features are presented in <xref ref-type="app" rid="app4">Multimedia Appendix 4</xref>.</p>
        <p>In terms of modeling the churn prediction problem, a user was said to churn in her <italic>k-th</italic> week if her last online activity occurred during her <italic>k-th</italic> week in the OHC. Similar to our hazard model, users whose last online activities occurred during the last 12 weeks in our dataset were not considered as churned. To predict whether a user would churn in the <italic>k-th</italic> week of her online activities, we focused on all users who were still active before the <italic>k-th</italic> week and extracted data based on their first <italic>k</italic>−1 weeks of activities. For example, the dataset for predicting user churn during the third week contains users who were still active in the OHC before their third week of online activities. Data of their behaviors during their first 2 weeks were collected for training. Users who churned in their third week and never came back were labeled as “positive” instances in the dataset.</p>
        <p>Previous studies indicate that different predictive models for each time period may not be an efficient solution. If the OHC wanted to know who would churn in their second and third weeks, 2 models were needed. Inspired by [<xref ref-type="bibr" rid="ref58">58</xref>], we tried to consolidate all predictive models for churn in different weeks into 1 unified model by leveraging a user’s social support activities across her complete “online life span.” Specifically, we added 1 new feature to the predictive model—time stamp <italic>t</italic>. An instance in the dataset would reflect a user’s historical activities until <italic>t</italic>. As the unit of <italic>t</italic> was the same for all users (a week in our experiment), 1 user could correspond to multiple instances in the dataset. For example, a user who churned in her third week of activities had 3 instances in the dataset—1 instance for her activities and features until the end of her first, second, and third week, respectively. The first 2 instances were labeled as “negative” because the user was still active during these 2 weeks, while the third instance was labeled as a “positive” instance because the user churned in her third week. In other words, the unified model tried to capture the complete life span of a user in the OHC.</p>
        <p>To train the unified model, 24,000 users were randomly selected from 47,581 users in the OHC to be included in the training dataset, while others were placed in the hold-out testing dataset. It is worth noting that the unified model with time stamps as a feature greatly increased the amount of training data because a loyal user who had been active for a long time would have many instances in the dataset. In our case, 24,000 users in the training dataset resulted in 132,341 instances in total. We built the training dataset and trained the model on a high-performance computing cluster. We also made sure that instances for the same user must belong to the same fold in cross-validation.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Results of Social Support Detection</title>
        <p>In our dataset from Breastcancer.org, there were more than 2.8 million posts contributed by nearly 50,000 users, including 107,549 initial posts. <xref ref-type="fig" rid="figure1">Figures 1</xref> and <xref ref-type="fig" rid="figure2">2</xref> show the distribution of the number of published posts and the time span of users’ posting activities in this OHC. The 2 plots indicate that users’ online behaviors featured highly skewed distributions that are similar to power-law distributions. In other words, many users were not very active in posting, while some users were very productive and stayed for a long time.</p>
        <p>Because we considered 5 categories of social supports and a post may belong to more than 1 category, we built a classifier for each category. For the classification of each category of social support, we applied various classification algorithms on annotated posts and picked the best performing algorithm using 10-fold cross-validation. Because posts seeking emotional support (SES) account for only a small proportion among annotated posts (22 out of 1333), we oversampled posts seeking emotional support when building the SES classifier. Among all the classifiers we tried, AdaBoost, with Naïve Bayesian as the weak learner, was chosen to classify COM, PES, PIS, and SIS, while logistic regression was the best choice for SES (<xref ref-type="table" rid="table3">Table 3</xref>). Overall, our classifiers achieved decent performance with an accuracy rate of more than 0.8 in all 5 classification tasks.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Performance of classification algorithms for 5 categories of social support.</p>
          </caption>
          <table width="571" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="55"/>
            <col width="55"/>
            <col width="55"/>
            <col width="65"/>
            <col width="80"/>
            <col width="50"/>
            <col width="50"/>
            <col width="45"/>
            <thead>
              <tr valign="top">
                <td>Social support</td>
                <td>Results</td>
                <td>Naïve Bayesian</td>
                <td>Logistic regression</td>
                <td>Support Vector Machine (polynomial kernel)</td>
                <td>Random forest</td>
                <td>Decision tree</td>
                <td>AdaBoost</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td rowspan="2">COM<sup>a</sup></td>
                <td>Accuracy</td>
                <td>.696</td>
                <td>.787</td>
                <td>.783</td>
                <td>.771</td>
                <td>.767</td>
                <td>.804<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td>AUC</td>
                <td>.839</td>
                <td>.817</td>
                <td>.768</td>
                <td>.848</td>
                <td>.75</td>
                <td>.852<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td rowspan="2">PES<sup>b</sup></td>
                <td>Accuracy</td>
                <td>.713</td>
                <td>.830</td>
                <td>.840<sup>f</sup></td>
                <td>.830</td>
                <td>.81</td>
                <td>.817</td>
              </tr>
              <tr valign="top">
                <td>AUC</td>
                <td>.823</td>
                <td>.787</td>
                <td>.681</td>
                <td>.825<sup>f</sup></td>
                <td>.687</td>
                <td>.817</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">PIS<sup>c</sup></td>
                <td>Accuracy</td>
                <td>.753</td>
                <td>.813</td>
                <td>.823<sup>f</sup></td>
                <td>.767</td>
                <td>.779</td>
                <td>.801</td>
              </tr>
              <tr valign="top">
                <td>AUC</td>
                <td>.824</td>
                <td>.83</td>
                <td>.783</td>
                <td>.837</td>
                <td>.717</td>
                <td>.859<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td rowspan="2">SES<sup>d</sup></td>
                <td>Accuracy</td>
                <td>.893</td>
                <td>.901</td>
                <td>.970<sup>f</sup></td>
                <td>.967</td>
                <td>.963</td>
                <td>.963</td>
              </tr>
              <tr valign="top">
                <td>AUC</td>
                <td>.749</td>
                <td>.867<sup>f</sup></td>
                <td>.656</td>
                <td>.851</td>
                <td>.671</td>
                <td>.668</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">SIS<sup>e</sup></td>
                <td>Accuracy</td>
                <td>.851</td>
                <td>.880</td>
                <td>.943<sup>f</sup></td>
                <td>.931</td>
                <td>.937</td>
                <td>.914</td>
              </tr>
              <tr valign="top">
                <td>AUC</td>
                <td>.893<sup>f</sup></td>
                <td>.803</td>
                <td>.745</td>
                <td>.86</td>
                <td>.766</td>
                <td>.869</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>COM: companionship.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>PES: providing emotional support.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>PIS: providing informational support.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>SES: seeking emotional support.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>SIS: seeking informational support.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>denotes the best performer for each row.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Total numbers of posts in each category of social support.</p>
          </caption>
          <table width="500" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Social support category</td>
                <td>Total number of posts</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Companionship (COM)</td>
                <td>932,538</td>
              </tr>
              <tr valign="top">
                <td>Seeking informational support (SIS)</td>
                <td>284,027</td>
              </tr>
              <tr valign="top">
                <td>Seeking emotional support (SES)</td>
                <td>227,188</td>
              </tr>
              <tr valign="top">
                <td>Providing informational support (PIS)</td>
                <td>1,034,682</td>
              </tr>
              <tr valign="top">
                <td>Providing emotional support (PES)</td>
                <td>497,096</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Log-log plot of users’ posting activities in the online health community (OHC).</p>
          </caption>
          <graphic xlink:href="jmir_v19i4e130_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Log-log plot for the time span of users’ online posting activities.</p>
          </caption>
          <graphic xlink:href="jmir_v19i4e130_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Results of Participation Analysis</title>
        <p><xref ref-type="table" rid="table5">Table 5</xref> shows the results of the participation analysis based on Cox Proportional Hazard models. Variables with hazard ratios lower than 1 contributed positively to the “survival” (ie, continued participation) of users, whereas those with hazard ratios higher than 1 were considered “hazardous” to keeping users in this OHC. Three independent variables (PIS, SES, and COM) had hazard ratios that were lower than 1, meaning that users who provided more informational support, sought more emotional support or posted more companionship had longer time spans of activities in the OHC. More specifically, a hazard ratio of 0.919 for companionship meant that a user’s “survival” rate after 1 month was 8.1% higher (100%-91.9%) if her number of companionship posts was one standard deviation higher than the average. In contrast, those who sought or received more informational support (SIS, RIS<sub>D</sub>, and RIS<sub>I</sub>) often left the OHC earlier. Other variables were not significant in the experiment (eg, PES).</p>
      </sec>
      <sec>
        <title>Results of Churn Prediction</title>
        <p>We measured the performance of predictive classifiers using standard metrics for classification, including precision, recall, F1 score, and area under the receiver operating characteristic curve (AUC). After comparing the performance of different classification algorithms (Naïve Bayes, logistic regression, and SVM with polynomial kernel) with 10-fold cross-validation on the training set, logistic regression emerged as the best performer for the unified model. As shown in <xref ref-type="table" rid="table6">Table 6</xref>, the model offers very good performance in predicting churn during the first week. Although recall of the positive class (ie, leaving the OHC) decreased for prediction in later weeks, the precision was still higher than 0.8, and the overall performance measured by AUC was still more than 0.9.</p>
        <p>We also plotted 2 hazard curves to visualize the model’s performance (<xref ref-type="fig" rid="figure3">Figure 3</xref>): one based on empirical data and the other based on predictions from the unified model. The horizontal axis represented weeks, and the vertical axis referred to the probability of users’ churn in specific weeks. The 2 curves were very close to each other, indicating good predictive performance from our model at the community level.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Results from the survival analysis experiment.</p>
          </caption>
          <table width="350" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="150"/>
            <col width="50"/>
            <thead>
              <tr valign="top">
                <td>Variables</td>
                <td>Hazard ratio</td>
                <td><italic>P</italic> Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>InitPost (control)</td>
                <td>.995</td>
                <td>.75</td>
              </tr>
              <tr valign="top">
                <td>PES<sup>a</sup></td>
                <td>1.000</td>
                <td>.99</td>
              </tr>
              <tr valign="top">
                <td>PIS<sup>b</sup></td>
                <td>.948***</td>
                <td>.001</td>
              </tr>
              <tr valign="top">
                <td>SES<sup>c</sup></td>
                <td>.972*</td>
                <td>.01</td>
              </tr>
              <tr valign="top">
                <td>SIS<sup>d</sup></td>
                <td>1.050***</td>
                <td>.000</td>
              </tr>
              <tr valign="top">
                <td>COM<sup>e</sup></td>
                <td>.919***</td>
                <td>.000</td>
              </tr>
              <tr valign="top">
                <td>RIS<sub>D</sub></td>
                <td>1.047*</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>RES<sub>D</sub></td>
                <td>.997</td>
                <td>.79</td>
              </tr>
              <tr valign="top">
                <td>RIS<sub>I</sub></td>
                <td>1.053*</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>RES<sub>I</sub></td>
                <td>.964</td>
                <td>.11</td>
              </tr>
              <tr valign="top">
                <td>RCOM</td>
                <td>.983</td>
                <td>.41</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>PES: providing emotional support.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>PIS: providing informational support.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>SES: seeking emotional support.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>SIS: seeking informational support.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>COM: companionship.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Performance of the unified model on hold-out testing sets in different weeks (precision and recall are for the positive class).</p>
          </caption>
          <table width="410" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="70"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td>Measures</td>
                <td>Churn in the 1st week</td>
                <td>Churn in the 3rd week</td>
                <td>Churn in the 5th week</td>
                <td>Churn in the 13th week</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Precision</td>
                <td>.950</td>
                <td>.872</td>
                <td>.880</td>
                <td>.838</td>
              </tr>
              <tr valign="top">
                <td>Recall</td>
                <td>.937</td>
                <td>.534</td>
                <td>.511</td>
                <td>.504</td>
              </tr>
              <tr valign="top">
                <td>F1 score</td>
                <td>.943</td>
                <td>.662</td>
                <td>.647</td>
                <td>.629</td>
              </tr>
              <tr valign="top">
                <td>AUC<sup>a</sup></td>
                <td>.972</td>
                <td>.901</td>
                <td>.909</td>
                <td>.929</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>AUC: area under the receiver operating characteristic (ROC) curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Empirical and predicted hazard curves for user participations.</p>
          </caption>
          <graphic xlink:href="jmir_v19i4e130_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The results of survival analysis showed that seeking or providing various types of social support was related to users’ participations in different ways. First, informational support is the most popular social support being sought and provided. This was expected for communities based on common social identities [<xref ref-type="bibr" rid="ref59">59</xref>] because the large amount of information about a disease and the common identity as patients of the disease are probably why many users come to the OHC in the first place. While providing more informational support is positively correlated with longer participations, seeking and receiving informational support are negatively associated with participations. In other words, those who focus on seeking information may not stay in the long run, even after they receive informational support.</p>
        <p>Second, companionship had the lowest hazard ratio. Recall that companionship includes discussions of offline events, sharing daily life stories, birthday wishes, and playing online games. This is a very interesting finding—even though this is an OHC about cancer, discussions of non–cancer-related issues are the key to keeping users engaged in the community. This highlights the importance of building personal bonds [<xref ref-type="bibr" rid="ref59">59</xref>] through off-topic discussions in the form of sharing personal stories about life or having fun together, which can strengthen the connections among users more than informational support. The role of companionship has significant implications for the management of an OHC. Although some OHCs may discourage off-topic discussions in order to achieve a “cleaner” environment with only relevant content, these discussions turn out to be a good way to bond users and keep them engaged, and OHC managers may want to encourage, or even initiate, more of these activities.</p>
        <p>Third, although we expected emotional support to be positively related to user participation as suggested by [<xref ref-type="bibr" rid="ref24">24</xref>], the results are mixed based on whether emotional support was being sought, provided, or received. The hazard ratio of SES was below 1 in the experiment, which contrasts with the effect of SIS and suggests that SES can be a sign of longer participations, especially for those who have been with the OHC for a while. However, providing and receiving emotional support are not significant factors. We conjectured that a fair amount of emotional support in the OHC could be generic and a mere formality (eg, “I will pray for you,” “Love you and Hug”). Such emotional support can still be valuable for those who seek support, but activities in providing and receiving such support are not related to users’ continued participations.</p>
        <p>Our survival analysis has shown the effects of social support activities on users’ engagement. How much do such social support activities contribute to the performance of the churn predictive model? To illustrate which features are more important for the unified model’s predictive power, we ranked the 145 features in the model using information gain [<xref ref-type="bibr" rid="ref60">60</xref>]. Among the top 20 features (<xref ref-type="table" rid="table7">Table 7</xref>), 11 were made possible only after our classification of different types of social support. Also, 18 of them were features that reflected the temporal dynamics in users’ social support activities, especially the stability during the last week of the training period. Overall, this shows that users’ activities in seeking, providing, and receiving different types of social support, as well as their temporal dynamics in these activities, can greatly enhance churn predictions in OHCs.</p>
        <p>In this research, we mined large-scale data to better understand and predict users’ continued participations in OHCs. We first detected the seeking and provision of different types of social support from OHC users’ posts using text mining techniques. Then, survival analysis revealed that companionship is a significant and positive predictor of users’ continued participations. Not limiting the potential of the large-scale data to descriptive analytics, we also developed a churn prediction model with high accuracies. Our work serves as an example that highlights the power of data analytics in exploring complex human behaviors.</p>
        <p>From a managerial perspective, the outcome of our study can provide OHC managers with suggestions on how to sustain users’ participations and decision support to retain users through interventions (eg, post recommendations and email reminders). A sustainable and successful OHC will eventually benefit its users. From a methodological perspective, this study was the first to use text mining to differentiate the seeking and providing of various types of social support from large-scale OHC data, and demonstrated how such detection of social support activities could help to understand and predict users’ engagement in OHCs.</p>
        <p>This study has practical implications. Traditionally, an OHC will send reminder emails to a user who has been inactive for a while, hoping to raise the user’s interest in coming back. With the help of our churn prediction model, an OHC can find at an early stage whether a user is about to leave. Then, it can intervene proactively and try to retain the user via email reminders. More importantly, instead of including a generic reminder or some random recent posts from the community, such emails can be designed based on the results of our survival analysis. For example, because companionship is a key predictor of users’ continued participations, including some of these companionship posts (eg, birthday wishes, holiday plans, and online scrabble games) in reminder emails may be more effective at keeping users engaged than having random posts or just informational posts.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Top 20 features by information gain for the full unified model.</p>
          </caption>
          <table width="450" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="50"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Rank</td>
                <td>Feature</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Stability of the total number of threads a user initiated during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Stability of the number of threads a user participated in during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Stability of the number of SIS<sup>a</sup> a user posted during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Stability of the number of SES<sup>b</sup> a user posted during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Stability of the total number of posts from a user during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Stability of the number of PIS<sup>c</sup> a user posted during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Stability of the number of PES<sup>d</sup> posts a user received directly during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Stability of the number of PES a user posted during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Stability of the number of COM<sup>e</sup> a user posted during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Stability of the number of PIS posts a user received directly during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Stability of the number of COM a user was exposed to during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>Stability of the number of PES posts a user received indirectly during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>Stability of the number of PIS posts a user received indirectly during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>Total number of posts from a user during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>The number of threads a user participated in during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>Stability of the number of threads a user participated in across weeks</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>Stability of the total number of posts from a user across weeks</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Entropy of the total number of posts from a user during the last week of the training period</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>Stability of the number of PIS posts a user received indirectly across weeks</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>Stability of the total number of threads a user initiated across weeks</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>SIS: seeking informational support.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>SES: seeking emotional support.</p>
            </fn>
            <fn id="table7fn3">
              <p><sup>c</sup>PIS: providing informational support.</p>
            </fn>
            <fn id="table7fn4">
              <p><sup>d</sup>PES: providing emotional support.</p>
            </fn>
            <fn id="table7fn5">
              <p><sup>e</sup>COM: companionship.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study also had limitations. First, for the 3 independent variables for indirect support received (<italic>RIS</italic><sub>I</sub><italic>, RES</italic><sub>I</sub><italic>, and RCOM</italic>), we assumed that a user received indirect support when she replied to a thread initiated by another user and read other users’ replies to the thread. This approach of capturing indirect support received could be inaccurate: on one hand, we might underestimate the amount of support because we limited our calculation to threads a user replied to, while a user could get indirect support by reading a thread without posting a reply. On the other hand, our approach might also overestimate such indirect support because when posting to a long thread, a user might not have time to read all the previous replies. This limitation can be addressed by analyzing users’ click streams, but such data were not available for this study and can be difficult to obtain for many studies of OHCs. The lack of clickstream data also prevented us from analyzing lurking behaviors, which might also provide social support to lurkers [<xref ref-type="bibr" rid="ref35">35</xref>]. Having users’ clickstream data will also help us better define each user’s temporal span of online activities. Second, our survival analysis only reveals the correlation between users’ social support activities and their participations, without showing any causality. Although randomized experiments are better choices to infer causality, there might be ethical concerns to run such experiments in OHCs (eg, keeping certain users away from social support). Alternative approaches are needed to identify causal relationships. Last but not least, our study was based on data from one OHC for breast cancer. In OHCs for other diseases, especially acute diseases (eg, flu), social support activities and users’ engagement patterns may differ. 
Although the specific results we found for this breast cancer OHC may not be applicable for all OHCs, the framework of methods we used to classify social support and analyze users’ continued participation based on social support activities can be applied to other OHCs.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>There are several interesting directions for future research. Detecting users’ health status from their posts will be an interesting endeavor, as it not only can help understand why a user leaves an OHC, but also can potentially improve the recommendation and retrieval of Web-based information. We are also interested in improving the unified predictive model, which is easier for OHCs to use. One possible way is to rebalance instances in the unified model’s dataset because the current dataset contains far more negative instances than positive ones. It would also be interesting to explore whether users’ engagement behaviors change over time, especially when accessing the Web using mobile devices has become more popular in recent years. We would also like to collaborate with OHC operators to evaluate the effectiveness of interventions aiming at keeping users engaged.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Post tagging guidelines and outcomes.</p>
        <media xlink:href="jmir_v19i4e130_app1.pdf" xlink:title="PDF File (Adobe PDF File), 62KB"/>
      </app>
      <app id="app2">
        <title>Multimedia Appendix 2</title>
        <p>Features engineering for social support classification.</p>
        <media xlink:href="jmir_v19i4e130_app2.pdf" xlink:title="PDF File (Adobe PDF File), 36KB"/>
      </app>
      <app id="app3">
        <title>Multimedia Appendix 3</title>
        <p>Hazard model.</p>
        <media xlink:href="jmir_v19i4e130_app3.pdf" xlink:title="PDF File (Adobe PDF File), 39KB"/>
      </app>
      <app id="app4">
        <title>Multimedia Appendix 4</title>
        <p>Features engineering for the churn predictive model.</p>
        <media xlink:href="jmir_v19i4e130_app4.pdf" xlink:title="PDF File (Adobe PDF File), 45KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb2">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">COM</term>
          <def>
            <p>companionship</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">OHC</term>
          <def>
            <p>online health community</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PES</term>
          <def>
            <p>providing emotional support</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PIS</term>
          <def>
            <p>providing informational support</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SES</term>
          <def>
            <p>seeking emotional support</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SIS</term>
          <def>
            <p>seeking informational support</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">TV</term>
          <def>
            <p>temporal variations</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>Kang Zhao’s work has been partially supported by the National Natural Science Foundation of China (Award #: 71572013).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fox</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>Pew Research Center</source>  
        <year>2011</year>  
        <access-date>2017-03-04</access-date>
        <comment>The social life of health information, 2011 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/files/old-media//Files/Reports/2011/PIP_Social_Life_of_Health_Info.pdf">http://www.pewinternet.org/files/old-media//Files/Reports/2011/PIP_Social_Life_of_Health_Info.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6oidDcGPg"/></comment> </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>White</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dorman</surname>
            <given-names>SM</given-names>
          </name>
        </person-group>
        <article-title>Receiving social support online: implications for health education</article-title>
        <source>Health Educ Res</source>  
        <year>2001</year>  
        <month>12</month>  
        <volume>16</volume>  
        <issue>6</issue>  
        <fpage>693</fpage>  
        <lpage>707</lpage>  
        <pub-id pub-id-type="medline">11780708</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Caplan</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Turner</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>Bringing theory to research on computer-mediated comforting communication</article-title>
        <source>Comput Human Behav</source>  
        <year>2007</year>  
        <month>3</month>  
        <volume>23</volume>  
        <issue>2</issue>  
        <fpage>985</fpage>  
        <lpage>98</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.sciencedirect.com/science/article/pii/S0747563205000555"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.chb.2005.08.003</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Bell</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>KB</given-names>
          </name>
          <name name-style="western">
            <surname>Bell</surname>
            <given-names>SB</given-names>
          </name>
        </person-group>
        <article-title>Health-related support groups on the internet: linking empirical findings to social support and computer-mediated communication theory</article-title>
        <source>J Health Psychol</source>  
        <year>2003</year>  
        <month>01</month>  
        <volume>8</volume>  
        <issue>1</issue>  
        <fpage>39</fpage>  
        <lpage>54</lpage>  
        <pub-id pub-id-type="doi">10.1177/1359105303008001429</pub-id>
        <pub-id pub-id-type="medline">22113899</pub-id>
        <pub-id pub-id-type="pii">8/1/39</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Social support within an on-line cancer community: an assessment of emotional support, perceptions of advantages and disadvantages, and motives for using the community from a communication perspective</article-title>
        <source>J Appl Commun Res</source>  
        <year>2002</year>  
        <month>01</month>  
        <volume>30</volume>  
        <issue>3</issue>  
        <fpage>195</fpage>  
        <lpage>209</lpage>  
        <pub-id pub-id-type="doi">10.1080/00909880216586</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chou</surname>
            <given-names>WY</given-names>
          </name>
          <name name-style="western">
            <surname>Hunt</surname>
            <given-names>YM</given-names>
          </name>
          <name name-style="western">
            <surname>Beckjord</surname>
            <given-names>EB</given-names>
          </name>
          <name name-style="western">
            <surname>Moser</surname>
            <given-names>RP</given-names>
          </name>
          <name name-style="western">
            <surname>Hesse</surname>
            <given-names>BW</given-names>
          </name>
        </person-group>
        <article-title>Social media use in the United States: implications for health communication</article-title>
        <source>J Med Internet Res</source>  
        <year>2009</year>  
        <month>08</month>  
        <volume>11</volume>  
        <issue>4</issue>  
        <fpage>e48</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2009/4/e48/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.1249</pub-id>
        <pub-id pub-id-type="pii">v11i4e48</pub-id>
        <pub-id pub-id-type="pmcid">PMC172661</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Barak</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Boniel-Nissim</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Suler</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Fostering empowerment in online support groups</article-title>
        <source>Comput Human Behav</source>  
        <year>2008</year>  
        <month>09</month>  
        <volume>24</volume>  
        <issue>5</issue>  
        <fpage>1867</fpage>  
        <lpage>83</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.chb.2008.02.004</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Social media mining for drug safety signal detection</article-title>
        <source>Proceedings of the 2012 international workshop on Smart health and wellbeing</source>  
        <year>2012</year>  
        <month>10</month>  
        <day>29</day>  
        <conf-name>CIKM Conference on Information and Knowledge Management</conf-name>
        <conf-date>October 29, 2012</conf-date>
        <conf-loc>Maui, HI</conf-loc>
        <fpage>33</fpage>  
        <lpage>40</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dl.acm.org/citation.cfm?doid=2389707.2389714"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1145/2389707.2389714</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Patient centered healthcare informatics</article-title>
        <source>IEEE Intelligent Informatics Bulletin</source>  
        <year>2014</year>  
        <month>12</month>  
        <volume>15</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://pdfs.semanticscholar.org/3766/3dc595c0ff7539a41afd0082eecc6ad04dba.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kraut</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Resnick</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Kiesler</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Burke</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Kittur</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Konstan</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ren</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Riedl</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>Building Successful Online Communities: Evidence-Based Social Design</source>  
        <year>2012</year>  
        <month>03</month>  
        <publisher-loc>Cambridge, MA</publisher-loc>
        <publisher-name>The MIT Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Young</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Community management that works: how to build and sustain a thriving online health community</article-title>
        <source>J Med Internet Res</source>  
        <year>2013</year>  
        <month>06</month>  
        <day>11</day>  
        <volume>15</volume>  
        <issue>6</issue>  
        <fpage>e119</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/6/e119/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2501</pub-id>
        <pub-id pub-id-type="medline">23759312</pub-id>
        <pub-id pub-id-type="pii">v15i6e119</pub-id>
        <pub-id pub-id-type="pmcid">PMC3713910</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Iriberri</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Leroy</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>A life-cycle perspective on online community success</article-title>
        <source>ACM Comput Surv</source>  
        <year>2009</year>  
        <month>02</month>  
        <day>01</day>  
        <volume>41</volume>  
        <issue>2</issue>  
        <fpage>1</fpage>  
        <lpage>29</lpage>  
        <pub-id pub-id-type="doi">10.1145/1459352.1459356</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bouma</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Admiraal</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>de Vries</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Schröder</surname>
            <given-names>CP</given-names>
          </name>
          <name name-style="western">
            <surname>Walenkamp</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Reyners</surname>
            <given-names>AK</given-names>
          </name>
        </person-group>
        <article-title>Internet-based support programs to alleviate psychosocial and physical symptoms in cancer patients: a literature analysis</article-title>
        <source>Crit Rev Oncol Hematol</source>  
        <year>2015</year>  
        <month>07</month>  
        <volume>95</volume>  
        <issue>1</issue>  
        <fpage>26</fpage>  
        <lpage>37</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.critrevonc.2015.01.011</pub-id>
        <pub-id pub-id-type="medline">25701515</pub-id>
        <pub-id pub-id-type="pii">S1040-8428(15)00014-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Campbell</surname>
            <given-names>HS</given-names>
          </name>
          <name name-style="western">
            <surname>Phaneuf</surname>
            <given-names>MR</given-names>
          </name>
          <name name-style="western">
            <surname>Deane</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Cancer peer support programs-do they work?</article-title>
        <source>Patient Educ Couns</source>  
        <year>2004</year>  
        <month>10</month>  
        <volume>55</volume>  
        <issue>1</issue>  
        <fpage>3</fpage>  
        <lpage>15</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.pec.2003.10.001</pub-id>
        <pub-id pub-id-type="medline">15476984</pub-id>
        <pub-id pub-id-type="pii">S073839910300301X</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Powell</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Englesakis</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rizo</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Stern</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Primary care health related virtual communities and electronic support groups: systematic review of the effects of online peer to peer interactions</article-title>
        <source>BMJ</source>  
        <year>2004</year>  
        <month>05</month>  
        <day>13</day>  
        <volume>328</volume>  
        <fpage>1166</fpage>  
        <pub-id pub-id-type="doi">10.1136/bmj.328.7449.1166</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hoey</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Ieropoli</surname>
            <given-names>SC</given-names>
          </name>
          <name name-style="western">
            <surname>White</surname>
            <given-names>VM</given-names>
          </name>
          <name name-style="western">
            <surname>Jefford</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Systematic review of peer-support programs for people with cancer</article-title>
        <source>Patient Educ Couns</source>  
        <year>2008</year>  
        <month>03</month>  
        <volume>70</volume>  
        <issue>3</issue>  
        <fpage>315</fpage>  
        <lpage>37</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.pec.2007.11.016</pub-id>
        <pub-id pub-id-type="medline">18191527</pub-id>
        <pub-id pub-id-type="pii">S0738-3991(07)00449-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Idriss</surname>
            <given-names>SZ</given-names>
          </name>
          <name name-style="western">
            <surname>Kvedar</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Watson</surname>
            <given-names>AJ</given-names>
          </name>
        </person-group>
        <article-title>The role of online support communities: benefits of expanded social networks to patients with psoriasis</article-title>
        <source>Arch Dermatol</source>  
        <year>2009</year>  
        <month>01</month>  
        <volume>145</volume>  
        <issue>1</issue>  
        <fpage>46</fpage>  
        <lpage>51</lpage>  
        <pub-id pub-id-type="doi">10.1001/archdermatol.2008.529</pub-id>
        <pub-id pub-id-type="medline">19153342</pub-id>
        <pub-id pub-id-type="pii">145/1/46</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Bantum</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Owen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Elhadad</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Does sustained participation in an online health community affect sentiment?</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2014</year>  
        <volume>2014</volume>  
        <fpage>1970</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954470"/>
        </comment>  
        <pub-id pub-id-type="medline">25954470</pub-id>
        <pub-id pub-id-type="pmcid">PMC4419987</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Burrows</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Nettleton</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Pleace</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Loader</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Muncer</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>VIRTUAL COMMUNITY CARE? SOCIAL POLICY AND THE EMERGENCE OF COMPUTER MEDIATED SOCIAL SUPPORT</article-title>
        <source>Information, Communication &#38; Society</source>  
        <year>2000</year>  
        <month>01</month>  
        <volume>3</volume>  
        <issue>1</issue>  
        <fpage>95</fpage>  
        <lpage>121</lpage>  
        <pub-id pub-id-type="doi">10.1080/136911800359446</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dunkel-Schetter</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Social support and cancer: findings based on patient interviews and their implications</article-title>
        <source>J Soc Issues</source>  
        <year>1984</year>  
        <volume>40</volume>  
        <issue>4</issue>  
        <fpage>77</fpage>  
        <lpage>98</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1540-4560.1984.tb01108.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Qiu</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Mitra</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Caragea</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Yen</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Get online support, feel better -- sentiment analysis and dynamics in an online cancer survivor community</article-title>
        <year>2011</year>  
        <month>10</month>  
        <conf-name>Privacy, Security, Risk and Trust and 2011 IEEE Third International Conference on Social Computing</conf-name>
        <conf-date>2011</conf-date>
        <conf-loc>Boston, MA</conf-loc>
        <fpage>274</fpage>  
        <lpage>281</lpage>  
        <pub-id pub-id-type="doi">10.1109/PASSAT/SocialCom.2011.127</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Maloney-Krichmar</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Preece</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A multilevel analysis of sociability, usability, and community dynamics in an online health community</article-title>
        <source>ACM Trans Comput-Hum Interact</source>  
        <year>2005</year>  
        <month>06</month>  
        <day>01</day>  
        <volume>12</volume>  
        <issue>2</issue>  
        <fpage>201</fpage>  
        <lpage>32</lpage>  
        <pub-id pub-id-type="doi">10.1145/1067860.1067864</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rodgers</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Q</given-names>
          </name>
        </person-group>
        <article-title>Internet community group participation: Psychosocial benefits for women with breast cancer</article-title>
        <source>J Comput Mediat Commun</source>  
        <year>2005</year>  
        <volume>10</volume>  
        <issue>4</issue>  
        <fpage>00</fpage>  
        <pub-id pub-id-type="doi">10.1111/j.1083-6101.2005.tb00268.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Kraut</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Levine</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>To stay or leave?: the relationship of emotional and informational support to commitment in online health support groups</article-title>
        <source>Proceedings of the ACM 2012 conference on Computer Supported Cooperative Work</source>  
        <year>2012</year>  
        <month>02</month>  
        <conf-name>ACM 2012 conference on Computer Supported Cooperative Work</conf-name>
        <conf-date>February 11-15, 2012</conf-date>
        <conf-loc>Seattle, WA</conf-loc>
        <publisher-loc>USA</publisher-loc>
        <publisher-name>ACM</publisher-name>
        <fpage>833</fpage>  
        <lpage>842</lpage>  
        <pub-id pub-id-type="doi">10.1145/2145204.2145329</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shumaker</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Brownell</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Toward a theory of social support: closing conceptual gaps</article-title>
        <source>J Soc Issues</source>  
        <year>1984</year>  
        <volume>40</volume>  
        <issue>4</issue>  
        <fpage>11</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1540-4560.1984.tb01105.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>House</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>Work Stress and Social Support</source>  
        <year>1981</year>  
        <publisher-loc>Reading, MA</publisher-loc>
        <publisher-name>Addison-Wesley Educational Publishers Inc</publisher-name></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Barrera</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Ainlay</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>The structure of social support: a conceptual and empirical analysis</article-title>
        <source>J Community Psychol</source>  
        <year>1983</year>  
        <month>04</month>  
        <volume>11</volume>  
        <issue>2</issue>  
        <fpage>133</fpage>  
        <lpage>43</lpage>  
        <pub-id pub-id-type="medline">10299305</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bambina</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>Online Social Support: The Interplay of Social Networks and Computer-Mediated Communication</source>  
        <year>2007</year>  
        <publisher-loc>Youngstown, NY</publisher-loc>
        <publisher-name>Cambria Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Keating</surname>
            <given-names>DM</given-names>
          </name>
        </person-group>
        <article-title>Spirituality and support: a descriptive analysis of online social support for depression</article-title>
        <source>J Relig Health</source>  
        <year>2013</year>  
        <month>09</month>  
        <volume>52</volume>  
        <issue>3</issue>  
        <fpage>1014</fpage>  
        <lpage>28</lpage>  
        <pub-id pub-id-type="doi">10.1007/s10943-012-9577-x</pub-id>
        <pub-id pub-id-type="medline">22322336</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Krause</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Social support, stress, and well-being among older adults</article-title>
        <source>J Gerontol</source>  
        <year>1986</year>  
        <month>07</month>  
        <volume>41</volume>  
        <issue>4</issue>  
        <fpage>512</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="medline">3722737</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Coulson</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Buchanan</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Aubeeluck</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Social support in cyberspace: a content analysis of communication within a Huntington's disease online support group</article-title>
        <source>Patient Educ Couns</source>  
        <year>2007</year>  
        <month>10</month>  
        <volume>68</volume>  
        <issue>2</issue>  
        <fpage>173</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.pec.2007.06.002</pub-id>
        <pub-id pub-id-type="medline">17629440</pub-id>
        <pub-id pub-id-type="pii">S0738-3991(07)00226-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Gong</surname>
            <given-names>X</given-names>
          </name>
        </person-group>
        <article-title>Social support and exchange patterns in an online smoking cessation intervention program</article-title>
        <source>Proceedings of the 2013 IEEE International Conference on Healthcare Informatics</source>  
        <year>2013</year>  
        <month>09</month>  
        <conf-name>2013 IEEE International Conference on Healthcare Informatics</conf-name>
        <conf-date>September 9, 2013</conf-date>
        <conf-loc>Philadelphia, PA</conf-loc>
        <fpage>219</fpage>  
        <lpage>28</lpage>  
        <pub-id pub-id-type="doi">10.1109/ICHI.2013.37</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lieberman</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>The role of insightful disclosure in outcomes for women in peer-directed breast cancer groups: a replication study</article-title>
        <source>Psychooncology</source>  
        <year>2007</year>  
        <month>10</month>  
        <volume>16</volume>  
        <issue>10</issue>  
        <fpage>961</fpage>  
        <lpage>4</lpage>  
        <pub-id pub-id-type="doi">10.1002/pon.1181</pub-id>
        <pub-id pub-id-type="medline">17328007</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gorlick</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bantum</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Owen</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Internet-based interventions for cancer-related distress: exploring the experiences of those whose needs are not met</article-title>
        <source>Psychooncology</source>  
        <year>2014</year>  
        <month>04</month>  
        <volume>23</volume>  
        <issue>4</issue>  
        <fpage>452</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="doi">10.1002/pon.3443</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Setoyama</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Yamazaki</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Namayama</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Benefits of peer support in online Japanese breast cancer communities: differences between lurkers and posters</article-title>
        <source>J Med Internet Res</source>  
        <year>2011</year>  
        <month>12</month>  
        <day>29</day>  
        <volume>13</volume>  
        <issue>4</issue>  
        <fpage>e122</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2011/4/e122/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.1696</pub-id>
        <pub-id pub-id-type="medline">22204869</pub-id>
        <pub-id pub-id-type="pii">v13i4e122</pub-id>
        <pub-id pub-id-type="pmcid">PMC3278108</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hambly</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Activity profile of members of an online health community after articular cartilage repair of the knee</article-title>
        <source>Sports Health</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>3</volume>  
        <issue>3</issue>  
        <fpage>275</fpage>  
        <lpage>82</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23016018"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/1941738111402151</pub-id>
        <pub-id pub-id-type="medline">23016018</pub-id>
        <pub-id pub-id-type="pii">10.1177_1941738111402151</pub-id>
        <pub-id pub-id-type="pmcid">PMC3445167</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Preece</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>Online communities: designing usability, supporting sociability</source>  
        <year>2000</year>  
        <publisher-loc>Chichester</publisher-loc>
        <publisher-name>John Wiley</publisher-name></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Burke</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Marlow</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Lento</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Feed me: motivating newcomer contribution in social network sites</article-title>
        <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>  
        <year>2009</year>  
        <month>04</month>  
        <conf-name>Conference on Human Factors in Computing Systems</conf-name>
        <conf-date>April 04-09, 2009</conf-date>
        <conf-loc>Boston, MA</conf-loc>
        <publisher-loc>New York, NY</publisher-loc>
        <publisher-name>ACM</publisher-name>
        <fpage>945</fpage>  
        <lpage>954</lpage>  
        <pub-id pub-id-type="doi">10.1145/1518701.1518847</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lakhani</surname>
            <given-names>KR</given-names>
          </name>
          <name name-style="western">
            <surname>Wolf</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <person-group person-group-type="editor">
          <name name-style="western">
            <surname>Feller</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Fitzgerald</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Hissam</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Lakhani</surname>
            <given-names>KR</given-names>
          </name>
        </person-group>
        <article-title>Why hackers do what they do: understanding motivation and effort in free/open source software projects</article-title>
        <source>Perspectives on free and open source software</source>  
        <year>2005</year>  
        <publisher-loc>Cambridge, MA</publisher-loc>
        <publisher-name>MIT Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nov</surname>
            <given-names>O</given-names>
          </name>
        </person-group>
        <article-title>What motivates Wikipedians?</article-title>
        <source>Commun ACM</source>  
        <year>2007</year>  
        <month>11</month>  
        <day>01</day>  
        <volume>50</volume>  
        <issue>11</issue>  
        <fpage>60</fpage>  
        <lpage>64</lpage>  
        <pub-id pub-id-type="doi">10.1145/1297797.1297798</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Khansa</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Liginlal</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Understanding members’ active participation in online question-and-answer communities: a theory and empirical analysis</article-title>
        <source>J Manage Inform Syst</source>  
        <year>2015</year>  
        <month>08</month>  
        <day>28</day>  
        <volume>32</volume>  
        <issue>2</issue>  
        <fpage>162</fpage>  
        <lpage>203</lpage>  
        <pub-id pub-id-type="doi">10.1080/07421222.2015.1063293</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Ackerman</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Adamic</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Activity lifespan: an analysis of user survival patterns in online knowledge sharing communities</article-title>
        <source>ICWSM 2010 - Proceedings of the 4th International AAAI Conference on Weblogs and Social Media</source>  
        <year>2010</year>  
        <conf-name>4th International AAAI Conference on Weblogs and Social Media</conf-name>
        <conf-date>May 23-26, 2010</conf-date>
        <conf-loc>Washington, DC</conf-loc>
        <fpage>186</fpage>  
        <lpage>93</lpage> </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Han</surname>
            <given-names>JY</given-names>
          </name>
          <name name-style="western">
            <surname>Moon</surname>
            <given-names>TJ</given-names>
          </name>
          <name name-style="western">
            <surname>Shaw</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>DV</given-names>
          </name>
          <name name-style="western">
            <surname>McTavish</surname>
            <given-names>FM</given-names>
          </name>
        </person-group>
        <article-title>The process and effect of supportive message expression and reception in online breast cancer support groups</article-title>
        <source>Psychooncology</source>  
        <year>2012</year>  
        <volume>21</volume>  
        <issue>5</issue>  
        <fpage>531</fpage>  
        <lpage>40</lpage>  
        <pub-id pub-id-type="doi">10.1002/pon.1942</pub-id>
        <pub-id pub-id-type="pmcid">PMC3168721</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Chiu</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <article-title>Turning telecommunications call details to churn prediction: a data mining approach</article-title>
        <source>Expert Syst Appl</source>  
        <year>2002</year>  
        <month>08</month>  
        <volume>23</volume>  
        <issue>2</issue>  
        <fpage>103</fpage>  
        <lpage>12</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0957-4174(02)00030-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Buckinx</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Van den Poel</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Customer base analysis: partial defection of behaviourally loyal clients in a non-contractual FMCG retail setting</article-title>
        <source>Eur J Oper Res</source>  
        <year>2005</year>  
        <month>07</month>  
        <volume>164</volume>  
        <issue>1</issue>  
        <fpage>252</fpage>  
        <lpage>68</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.ejor.2003.12.010</pub-id></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Kechadi</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Buckley</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Customer churn prediction for broadband internet services</article-title>
        <source>Proceedings of the 11th International Conference on Data Warehousing and Knowledge Discovery</source>  
        <year>2009</year>  
        <month>09</month>  
        <conf-name>11th International Conference on Data Warehousing and Knowledge Discovery</conf-name>
        <conf-date>August 31-September 02, 2009</conf-date>
        <conf-loc>Linz, Austria</conf-loc>
        <publisher-loc>Heidelberg</publisher-loc>
        <publisher-name>Springer-Verlag Berlin</publisher-name>
        <fpage>229</fpage>  
        <lpage>43</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://link.springer.com/chapter/10.1007/978-3-642-03730-6_19"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/978-3-642-03730-6_19</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kawale</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pal</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Srivastava</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Churn prediction in MMORPGs: a social influence based approach</article-title>
        <source>Proceedings of the 2009 International Conference on Computational Science and Engineering</source>  
        <year>2009</year>  
        <month>08</month>  
        <conf-name>2009 International Conference on Computational Science and Engineering</conf-name>
        <conf-date>August 29-31, 2009</conf-date>
        <conf-loc>Vancouver, BC, Canada</conf-loc>
        <fpage>423</fpage>  
        <lpage>28</lpage>  
        <pub-id pub-id-type="doi">10.1109/CSE.2009.80</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Backiel</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Baesens</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Claeskens</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Mining telecommunication networks to enhance customer lifetime predictions</article-title>
        <source>Artificial Intelligence and Soft Computing</source>  
        <year>2014</year>  
        <conf-name>13th International Conference ICAISC 2014</conf-name>
        <conf-date>June 1-5, 2014</conf-date>
        <conf-loc>Zakopane, Poland</conf-loc>
        <publisher-loc>Cham, Switzerland</publisher-loc>
        <publisher-name>Springer International Publishing</publisher-name>
        <fpage>15</fpage>  
        <lpage>26</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://link.springer.com/chapter/10.1007/978-3-319-07176-3_2"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/978-3-319-07176-3_2</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Berson</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Thearling</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <source>Building Data Mining Applications for CRM</source>  
        <year>1999</year>  
        <publisher-loc>London</publisher-loc>
        <publisher-name>McGraw-Hill</publisher-name></nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wan</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Predicting customer churn through interpersonal influence</article-title>
        <source>Knowl-Based Syst</source>  
        <year>2012</year>  
        <month>4</month>  
        <day>01</day>  
        <volume>28</volume>  
        <issue>17</issue>  
        <fpage>97</fpage>  
        <lpage>104</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.knosys.2011.12.005</pub-id></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shmueli</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Koppius</surname>
            <given-names>O</given-names>
          </name>
        </person-group>
        <article-title>Predictive analytics in information systems research</article-title>
        <source>MIS Quarterly</source>  
        <year>2011</year>  
        <month>09</month>  
        <volume>35</volume>  
        <issue>3</issue>  
        <fpage>553</fpage>  
        <lpage>72</lpage> </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Barbieri</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Bonchi</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Manco</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Who to follow and why: link prediction with explanations</article-title>
        <source>Proceedings of the 20th ACM SIGKDD international conference on Knowledge discovery and data mining</source>  
        <year>2014</year>  
        <conf-name>20th ACM SIGKDD international conference on Knowledge discovery and data mining</conf-name>
        <conf-date>August 24-27, 2014</conf-date>
        <conf-loc>New York, NY</conf-loc>
        <publisher-loc>New York, NY, USA</publisher-loc>
        <publisher-name>ACM</publisher-name>
        <fpage>1266</fpage>  
        <lpage>1275</lpage>  
        <pub-id pub-id-type="doi">10.1145/2623330.2623733</pub-id></nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sachan</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Contractor</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Faruquie</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Subramaniam</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Using content and interactions for discovering communities in social networks</article-title>
        <source>Proceedings of the 21st international conference on World Wide Web</source>  
        <year>2012</year>  
        <conf-name>21st international conference on World Wide Web</conf-name>
        <conf-date>April 16-20, 2012</conf-date>
        <conf-loc>Lyon, France</conf-loc>
        <publisher-loc>New York, NY, USA</publisher-loc>
        <publisher-name>ACM</publisher-name>
        <fpage>331</fpage>  
        <lpage>40</lpage>  
        <pub-id pub-id-type="doi">10.1145/2187836.2187882</pub-id></nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Yen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Greer</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Qiu</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Mitra</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Portier</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Finding influential users of online health communities: a new metric based on sentiment influence</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <month>10</month>  
        <volume>21</volume>  
        <issue>e2</issue>  
        <fpage>e212</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24449805"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002282</pub-id>
        <pub-id pub-id-type="medline">24449805</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2013-002282</pub-id>
        <pub-id pub-id-type="pmcid">PMC4173171</pub-id></nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Levine</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Moreland</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Group socialization: theory and research</article-title>
        <source>Eur Rev Soc Psychol</source>  
        <year>1994</year>  
        <month>01</month>  
        <volume>5</volume>  
        <issue>1</issue>  
        <fpage>305</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1080/14792779543000093</pub-id></nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cox</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Regression Models and Life-Tables</article-title>
        <source>J R Stat Soc Series B (Methodological)</source>  
        <year>1972</year>  
        <volume>34</volume>  
        <issue>2</issue>  
        <fpage>187</fpage>  
        <lpage>220</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.jstor.org/stable/2985181?seq=1#page_scan_tab_contents"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kumar</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Who blogs what: understanding the publishing behavior of bloggers</article-title>
        <source>World Wide Web</source>  
        <year>2012</year>  
        <month>5</month>  
        <day>17</day>  
        <volume>16</volume>  
        <issue>5-6</issue>  
        <fpage>621</fpage>  
        <lpage>44</lpage>  
        <pub-id pub-id-type="doi">10.1007/s11280-012-0167-3</pub-id></nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Street</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Mangasarian</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Wolberg</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>An inductive learning approach to prognostic prediction</article-title>
        <source>Proceedings of the Twelfth International Conference on Machine Learning</source>  
        <year>1995</year>  
        <conf-name>12th International Conference on Machine Learning</conf-name>
        <conf-date>1995</conf-date>
        <conf-loc>San Francisco, CA</conf-loc>
        <fpage>522</fpage>  
        <lpage>30</lpage> </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ren</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Kraut</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Kiesler</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Applying common identity and bond theory to design of online communities</article-title>
        <source>Organ Stud</source>  
        <year>2007</year>  
        <month>03</month>  
        <volume>28</volume>  
        <issue>3</issue>  
        <fpage>377</fpage>  
        <lpage>408</lpage>  
        <pub-id pub-id-type="doi">10.1177/0170840607076007</pub-id></nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Quinlan</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Induction of decision trees</article-title>
        <source>Mach Learn</source>  
        <year>1986</year>  
        <volume>1</volume>  
        <issue>1</issue>  
        <fpage>81</fpage>  
        <lpage>106</lpage>  
        <pub-id pub-id-type="doi">10.1023/A:1022643204877</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
