<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JC</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Cancer</journal-id>
      <journal-title>JMIR Cancer</journal-title>
      <issn pub-type="epub">2369-1999</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i3e29555</article-id>
      <article-id pub-id-type="pmid">34491209</article-id>
      <article-id pub-id-type="doi">10.2196/29555</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Understanding Communication in an Online Cancer Forum: Content Analysis Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Vollmer Dahlke</surname>
            <given-names>Deborah</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Jang</surname>
            <given-names>Hyeju</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Torii</surname>
            <given-names>Manabu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Andy</surname>
            <given-names>Anietie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Penn Medicine Center for Digital Health</institution>
            <institution>University of Pennsylvania</institution>
            <addr-line>3400 Civic Blvd</addr-line>
            <addr-line>Philadelphia, PA, 19104</addr-line>
            <country>United States</country>
            <phone>1 202 486 4095</phone>
            <email>andyanietie@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7043-3042</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Andy</surname>
            <given-names>Uduak</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1213-6912</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Penn Medicine Center for Digital Health</institution>
        <institution>University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Division of Urogynecology and Pelvic Reconstructive Surgery</institution>
        <institution>Department of Obstetrics and Gynecology</institution>
        <institution>Hospital of the University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Anietie Andy <email>andyanietie@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jul-Sep</season>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>7</day>
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <volume>7</volume>
      <issue>3</issue>
      <elocation-id>e29555</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>24</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>20</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>10</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Anietie Andy, Uduak Andy. Originally published in JMIR Cancer (https://cancer.jmir.org), 07.09.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cancer, is properly cited. The complete bibliographic information, a link to the original publication on https://cancer.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://cancer.jmir.org/2021/3/e29555" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Cancer affects individuals, their family members, and friends, and increasingly, some of these individuals are turning to online cancer forums to express their thoughts/feelings and seek support such as asking cancer-related questions. The thoughts/feelings expressed and the support needed from these online forums may differ depending on if (1) an individual has or had cancer or (2) an individual is a family member or friend of an individual who has or had cancer; the language used in posts in these forums may reflect these differences.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Using natural language processing methods, we aim to determine the differences in the support needs and concerns expressed in posts published on an online cancer forum by (1) users who self-declare to have or had cancer compared with (2) users who self-declare to be family members or friends of individuals with or that had cancer.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Using latent Dirichlet allocation (LDA), which is a natural language processing algorithm and Linguistic Inquiry and Word Count (LIWC), a psycholinguistic dictionary, we analyzed posts published on an online cancer forum with the aim to delineate the language features associated with users in these different groups.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Users who self-declare to have or had cancer were more likely to post about LDA topics related to hospital visits (Cohen <italic>d</italic>=0.671) and use words associated with LIWC categories related to health (Cohen <italic>d</italic>=0.635) and anxiety (Cohen <italic>d</italic>=0.126). By contrast, users who declared to be family members or friends tend to post about LDA topics related to losing a family member (Cohen <italic>d</italic>=0.702) and LIWC categories focusing on the past (Cohen <italic>d</italic>=0.465) and death (Cohen <italic>d</italic>=0.181) were more associated with these users.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Using LDA and LIWC, we show that there are differences in the support needs and concerns expressed in posts published on an online cancer forum by users with cancer compared with family members or friends of those with cancer. Hence, responders to online cancer forums need to be cognizant of these differences in support needs and concerns and tailor their responses based on these findings.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>Cancer</kwd>
        <kwd>Reddit</kwd>
        <kwd>online forum</kwd>
        <kwd>natural language processing</kwd>
        <kwd>latent Dirichlet allocation</kwd>
        <kwd>Linguistic Inquiry and Word Count</kwd>
        <kwd>psycholinguistics</kwd>
        <kwd>social media</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Increasingly, individuals affected by cancer are seeking support on online cancer forums [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. These forums function as a support group where individuals can seek and receive support around cancer from members of the forum, some of whom may (from their personal experience) be familiar with the support expressed.</p>
        <p>Prior work determined that members of online cancer forums who self-declare to be diagnosed with cancer or going through cancer treatment tend to seek advice [<xref ref-type="bibr" rid="ref5">5</xref>] and the more emotional support members of an online cancer forum received, the more likely they were to continue their membership in the forum [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>The support needs and concerns expressed in online cancer forum posts may vary depending on who is accessing the forum; for example, the support needs expressed by individuals with cancer may vary from those of individuals who are family members or friends of individuals with cancer. In prior work, researchers have used language features from social media and online forum posts to determine whether users belong to different groups such as different age groups [<xref ref-type="bibr" rid="ref7">7</xref>] and genders [<xref ref-type="bibr" rid="ref8">8</xref>], to identify and characterize users who express loneliness from other users (who do not express loneliness) [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], and to predict patients risk for cardiovascular disease [<xref ref-type="bibr" rid="ref11">11</xref>]. Similarly, in this paper, we analyze posts published on an online cancer forum on Reddit to determine the language features that delineate posts by users who self-declare to have or had cancer (we will refer to this group as the “has cancer” group) from posts by users who self-declare to be family members or friends of individuals with cancer (referred to as the “family or friend” group).</p>
        <p>We hypothesize that these language features will reflect the differences in support needs and concerns expressed by users who belong to these different groups.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>Users join online health forums to seek and give support as it relates to their health and well-being and that of others. Prior work has shown that online health forums are an effective way for seeking and giving support around mental health [<xref ref-type="bibr" rid="ref12">12</xref>], substance use recovery [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], and cancer [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Prior work analyzed posts and comments on an online cancer forum and determined that members expressed more negative personal information in public messages compared with private messages [<xref ref-type="bibr" rid="ref4">4</xref>] and the more emotional support members received, the higher the chance they will continue their membership in the forum [<xref ref-type="bibr" rid="ref6">6</xref>]. Members of an online cancer forum who were either diagnosed with cancer or going through cancer treatment tended to seek advice and survivors of cancer shared their cancer-related experiences [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>Over the course of their membership, members of an online cancer forum take on various roles on the forum and for individuals who have been members of the forum for a long period, these roles tend to be more focused on encouraging other members compared with their roles when they first became members of the forum, which tended to be related to seeking information [<xref ref-type="bibr" rid="ref3">3</xref>]. These forums provide significant peer-to-peer support to individuals seeking support; hence, it is important that members of the forum responding to posts have an accurate understanding of the types of support being sought.</p>
        <p>Our work in this paper is different from prior work analyzing posts in online cancer forums as they did not delineate posts by members of the forum that have/had cancer from those who are family or friends.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data</title>
        <p>Our data comprise posts from an active online cancer forum on Reddit, <italic>/r/Cancer</italic>, which is the cancer forum with the most number of users (37,000 members as of March 2021) on Reddit. <italic>/r/Cancer</italic> is self-described as “This reddit is for the discussion of cancer, cancer related news, stories of survival, stories of loss and everything else associated with the disease.” Using Google’s BigQuery [<xref ref-type="bibr" rid="ref15">15</xref>], which is a data store with publicly available Reddit data sets, we collected 29,533 posts published between December 2015 and August 2019 on <italic>/r/Cancer</italic>. From these posts, we identified users who self-declared to have or had cancer by selecting the user names of authors of posts that explicitly mentioned that the author of the post either has or had cancer; specifically, we selected posts which contained the word “cancer” and a first-person singular pronoun (ie, “I” and “me”), for example, “Just got diagnosed with lung cancer, how do I cope”. One of the coauthors (AA) reviewed these posts and took out the posts that were not indicating that a user has or had cancer. Similarly, we identified users who self-declared to be family members or friends of individuals with or that had cancer by selecting the user names of authors of posts that explicitly mentioned that a family member or friend has or had cancer; specifically, we selected posts which contained the word “cancer” and also contained the following keywords associated with family members and friends: “mother,” “mom,” “father,” “dad,” “parent,” “grand mother,” “grandmother,” “grand mom,” “grand ma,” “grand father,” “grandfather,” “grand dad,” “granddad,” “grand pa,” “husband,” “wife,” “spouse,” “son,” “daughter,” “child,” “aunty,” “aunt,” “uncle,” “nephew,” “niece,” “sister,” “brother,” “family,” “friend,” for example, “My young child is battling cancer.” One of the coauthors (AA) reviewed these posts and took out the posts that were not indicating that a user was a family member or friend of an individual with or that had cancer. Given the user names of users who either self-declared in posts to have or had cancer or were family members or friends of individuals with or that had cancer, we collected all their posts published in the forum (ie, <italic>/r/Cancer</italic>). <xref ref-type="table" rid="table1">Table 1</xref> shows a summary of our data set.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of our data set. This shows the number of posts by (1) users who self-declared to have or had cancer (the “has cancer” group) and (2) users who self-declared to be family members or friends (the “family or friend” group) of individuals with cancer.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="450"/>
            <col width="340"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td>Category</td>
                <td>Number of posts</td>
                <td>Number of users</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>The “has cancer” group</td>
                <td>4414</td>
                <td>2938</td>
              </tr>
              <tr valign="top">
                <td>The “family or friend” group</td>
                <td>3483</td>
                <td>2456</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Differences in Language Use</title>
        <p>We used 2 approaches to determine the differences in language use in posts by users who belong to either the “has cancer” group or the “family or friend” group. Specifically, we used (1) an open vocabulary method and (2) a dictionary-based method. In all the analysis in this work, we report the effect size by using Cohen <italic>d</italic>, which is the standardized difference between means.</p>
      </sec>
      <sec>
        <title>Open Vocabulary Method</title>
        <p>In this section, we use a natural language processing topic modeling algorithm, latent Dirichlet allocation (LDA) [<xref ref-type="bibr" rid="ref16">16</xref>], which is used to identify and group co-occurring words in documents (ie, Reddit posts in this work); these word groups are referred to as <italic>topics</italic>. LDA is a generative model which assumes that topics consist of a combination of words and tokens and Reddit posts consist of a mixture of topics. As words in Reddit posts are known, the latent variables of the topics can be estimated using Gibbs sampling [<xref ref-type="bibr" rid="ref17">17</xref>]. Labels can be assigned to the various topics based on the content words associated with the topic. For example, LDA may cluster the words “Monday,” “Tuesday,” “Wednesday,” “Thursday,” and “Friday'” as days of the week. Using the DLATK package [<xref ref-type="bibr" rid="ref18">18</xref>], we generated 20 LDA topics from the /r/Cancer posts by users that self-declared to have or had cancer (ie, the “has cancer” group) and users who self-declared to be family members or friends (ie, the “family or friend” group); we chose to generate 20 topics because we varied the number of LDA topics by using 10, 20, 30, and 40 topics, and one of the coauthors (AA) reviewed these topics and observed that the topic themes from 20 topics had the most coherent themes. Similar to prior works which used LDA to identify the topic themes from social media posts most associated with users who expressed loneliness from those who did not [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] and to delineate posts by individuals belonging to different age groups [<xref ref-type="bibr" rid="ref7">7</xref>] and genders [<xref ref-type="bibr" rid="ref8">8</xref>], we used the DLATK package [<xref ref-type="bibr" rid="ref18">18</xref>] to identify the topic themes most associated with posts belonging to the “has cancer” group when compared with posts belonging to the “family or friend” group, and vice versa.</p>
      </sec>
      <sec>
        <title>Dictionary-Based Method</title>
        <p>In this section, we used Linguistic Inquiry and Word Count (LIWC) [<xref ref-type="bibr" rid="ref19">19</xref>], which is a psycholinguistic dictionary with 73 categories (eg, positive and negative emotions, health, and personal pronouns) and a curated list of words associated with these categories. Specifically, using the DLATK package [<xref ref-type="bibr" rid="ref18">18</xref>], we determined the frequency of occurrence of words associated with LIWC categories in posts belonging to the “has cancer” group compared with the “family or friend” group.</p>
      </sec>
      <sec>
        <title>Ethics and Privacy</title>
        <p>This study was deemed exempt by the Institutional Review Board guidelines of the authors institution. The data set used for this work is publicly available. The authors of this work did not contact any member or moderator of the forum /<italic>r/Cancer</italic> nor did we contact any Reddit users. Besides, Reddit user profile information was not reviewed or used in this work.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Open Vocabulary Method</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the effect sizes (using Cohen <italic>d</italic>) of the most significant LDA topics (<italic>P</italic>&#60;.001 [Benjamini–Hochberg <italic>P</italic> correction]) associated with <italic>/r/Cancer</italic> posts by users that belong to the “has cancer” group compared with posts by users belonging to the “family or friend” group. In addition, <xref ref-type="table" rid="table3">Table 3</xref> shows the effect sizes (using Cohen <italic>d</italic>) of the most significant LDA topics associated with <italic>/r/Cancer</italic> posts by users belonging to the “family or friend” group compared with posts by users that belong to the “has cancer” group. The authors of the paper independently labeled each topic theme and then met to discuss and agree on the labels for each topic theme.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>LDA topics associated with posts by users who self-declared to have or had cancer (ie, the “has cancer” group) compared with posts by users in the “family or friend” group.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="270"/>
            <col width="640"/>
            <col width="90"/>
            <thead>
              <tr valign="bottom">
                <td>LDA<sup>a</sup> topic themes</td>
                <td>Highly correlated words in topics</td>
                <td>Cohen <italic>d</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Hospital visit</td>
                <td>pain, hospital, back, days, blood, started, doctor, home, worse, ER</td>
                <td>0.671</td>
              </tr>
              <tr valign="top">
                <td>Questions/seeking advice</td>
                <td>advice, good, wondering, experience, type, information, questions, survival, early, similar</td>
                <td>0.537</td>
              </tr>
              <tr valign="top">
                <td>Symptoms, risk, and cure of disease</td>
                <td>cells, risk, cure, disease, symptoms, cancers, cervical, pancreatic, body, patients</td>
                <td>0.474</td>
              </tr>
              <tr valign="top">
                <td>Research/questions around cancer</td>
                <td>research, patient, part, study, breast, questions, diagnosis, prostrate, find, survivor</td>
                <td>0.432</td>
              </tr>
              <tr valign="top">
                <td>Cancer surgery</td>
                <td>surgery, colon, removed, tumor, thyroid, remove, lymph, kidney, nodes, stomach</td>
                <td>0.349</td>
              </tr>
              <tr valign="top">
                <td>Cost/payment for treatment</td>
                <td>treatment, insurance, medical, money, health, clinical, working, options, pay, trials</td>
                <td>0.345</td>
              </tr>
              <tr valign="top">
                <td>Change in diet</td>
                <td>eat, weight, food, stomach, throat, diet, healthy, tongue, taste, loss</td>
                <td>0.293</td>
              </tr>
              <tr valign="top">
                <td>Tests around cancer</td>
                <td>scan, biopsy, back, doctor, results, CT, lymph, found, oncologist, tumor</td>
                <td>0.290</td>
              </tr>
              <tr valign="top">
                <td>Support from people/community</td>
                <td>support, people, post, free, share, story, group, love, hope, great</td>
                <td>0.245</td>
              </tr>
              <tr valign="top">
                <td>Side effects of treatment</td>
                <td>chemo, treatment, radiation, side, effects, week, hair, round, pretty, started</td>
                <td>0.214</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>LDA: latent Dirichlet allocation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>LDA topics associated with posts by users who self-declared to be family members or friends of individuals with or that had cancer (ie, the “family or friend” group) compared with posts by users in the “has cancer” group.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="290"/>
            <col width="610"/>
            <col width="100"/>
            <thead>
              <tr valign="bottom">
                <td>LDA<sup>a</sup> topic themes</td>
                <td>Highly correlated words in topics</td>
                <td>Cohen <italic>d</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Losing family member</td>
                <td>mom, day, passed, lost, home, didn't, love, hospital, wanted, made</td>
                <td>0.702</td>
              </tr>
              <tr valign="top">
                <td>Caring for family member</td>
                <td>sister, brother, family, wife, home, work, parents, mother, live, care</td>
                <td>0.373</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis of family member</td>
                <td>dad, he’s, father, diagnosed, stage, ago, found, lung, today, pancreatic</td>
                <td>0.339</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis of family member</td>
                <td>mom, stage, breast, diagnosed, advice, she's, friend, ovarian, grandma, lung</td>
                <td>0.179</td>
              </tr>
              <tr valign="top">
                <td>Talk around support</td>
                <td>time, life, family, things, make, support, care, health, long, difficult</td>
                <td>0.159</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>LDA: latent Dirichlet allocation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Dictionary-Based Method</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows the effect sizes (using Cohen <italic>d</italic>) and LIWC categories that are more associated with posts belonging to the “has cancer” group when compared with the “family or friend” group. In addition, <xref ref-type="table" rid="table5">Table 5</xref> shows the effect sizes (using Cohen <italic>d</italic>) and LIWC categories that are more associated with posts by the “family or friend” group when compared with posts by the “has cancer” group.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>LIWC categories most associated with posts belonging to the “has cancer” group when compared with the “family or friend” group. Effect size is reported as Cohen <italic>d</italic>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="720"/>
            <col width="280"/>
            <thead>
              <tr valign="bottom">
                <td>LIWC<sup>a</sup> category</td>
                <td>Cohen <italic>d</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Health</td>
                <td>0.635</td>
              </tr>
              <tr valign="top">
                <td>Biological processes</td>
                <td>0.607</td>
              </tr>
              <tr valign="top">
                <td>Second-person pronouns</td>
                <td>0.234</td>
              </tr>
              <tr valign="top">
                <td>Anxiety</td>
                <td>0.126</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>LIWC: Linguistic Inquiry and Word Count.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>LIWC categories most associated with posts belonging to the “family or friend” group when compared with posts by the “has cancer” group. Effect size is reported as Cohen <italic>d</italic>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="720"/>
            <col width="280"/>
            <thead>
              <tr valign="bottom">
                <td>LIWC<sup>a</sup> category</td>
                <td>Cohen <italic>d</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Third-person singular pronoun</td>
                <td>1.168</td>
              </tr>
              <tr valign="top">
                <td>Personal pronoun</td>
                <td>0.977</td>
              </tr>
              <tr valign="top">
                <td>Female references</td>
                <td>0.964</td>
              </tr>
              <tr valign="top">
                <td>Male references</td>
                <td>0.746</td>
              </tr>
              <tr valign="top">
                <td>First-person singular pronouns</td>
                <td>0.543</td>
              </tr>
              <tr valign="top">
                <td>Past focus</td>
                <td>0.465</td>
              </tr>
              <tr valign="top">
                <td>Affiliation</td>
                <td>0.398</td>
              </tr>
              <tr valign="top">
                <td>First-person plural pronouns</td>
                <td>0.242</td>
              </tr>
              <tr valign="top">
                <td>Sadness</td>
                <td>0.224</td>
              </tr>
              <tr valign="top">
                <td>Time</td>
                <td>0.222</td>
              </tr>
              <tr valign="top">
                <td>Present focus</td>
                <td>0.221</td>
              </tr>
              <tr valign="top">
                <td>Death</td>
                <td>0.181</td>
              </tr>
              <tr valign="top">
                <td>Friends</td>
                <td>0.175</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>LIWC: Linguistic Inquiry and Word Count.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this work, using LDA and LIWC, we show that there are differences in the support needs and concerns expressed in online cancer forum posts by users who belong to the “has cancer” group compared with those belonging to the “family or friend” group. In the following section, we summarize the findings from this work.</p>
        <p>In our analysis, we observed that users who self-declare to have or had cancer tend to post about topic themes such as their hospital visits and seeking advice and information as these relate to cancer; this finding is in line with previous work [<xref ref-type="bibr" rid="ref5">5</xref>], which showed that individuals who self-declared (in an online cancer forum) to be diagnosed with cancer or undergoing treatment mostly sought advice from other members of the forum. We also observed that users who self-declared to have cancer tend to post about topics themes related to the cost/payments for their treatments, change in diet, and side effects of treatment, and use words associated with LIWC categories related to health and anxiety. These findings can aid in the design of processes for providing better support on online cancer forums. For example, the cost for cancer treatment can be expensive, and because users who self-declare to have or had cancer tend to post about topic themes related to cost/payment for their treatment, online cancer forums can partner with health care providers and relevant organizations to come up with and document detailed ways and tips in which patients with cancer can approach paying for their treatment; this information can be made easily available and accessible to users on the online forum. A similar thing can be done for other user concerns such as change in diet and side effects of treatments. Given that LIWC categories associated with anxiety are more associated with users who self-declared to have or had cancer, online cancer forums can provide/recommend professional mental health services to these users.</p>
        <p>For users who self-declared to be family members or friends of individuals diagnosed with cancer, we observed that they tend to post about topic themes such as losing a family member, caring for a family member, and the diagnosis of a family member; also, these users tend to use words associated with LIWC categories focusing on the past/present, sadness, and death. Given that some of the topic themes users who self-declare to be family members or friends tend to post about are caring for a family member and the diagnosis of a family member, online cancer forums can partner with health care providers to document ways in which these users can provide support and care to their loved ones with cancer—this information can be made easily accessible on the forum. Besides, given that LIWC categories associated with past/present, sadness, and death are more associated with the “family or friends” group, this may imply that users belonging to this group express (in their posts) having a difficult time coping with either losing their loved one or their loved one being sick; hence, the cancer forum can provide professional mental health counselors who can provide help to these users on how to cope with a loved one being sick or losing a loved one.</p>
      </sec>
      <sec>
        <title>Limitation</title>
        <p>Prior work determined that the interests of members of online forums focused on similar topics may differ [<xref ref-type="bibr" rid="ref20">20</xref>]; hence, a limitation of this work is that the language used on <italic>/r/Cancer</italic> may differ from that used in other online cancer forums. In addition, the sample used in this work is composed of Reddit users who publish posts on the subreddit <italic>/r/Cancer</italic> and is not representative of all users affected by cancer.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>In this paper, using LDA and LIWC, we determined the LDA topics and LIWC categories associated with posts by (1) users who self-declared to have or had cancer and (2) users who self-declared to be family members or friends of individuals with cancer; also, we observed that these language use differences reflect the differences in support needs and concerns expressed in posts belonging to these groups.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LIWC</term>
          <def>
            <p>Linguistic Inquiry and Word Count</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Eliciting and receiving online support: using computer-aided content analysis to examine the dynamics of online social support</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>04</month>
          <day>20</day>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>e99</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/4/e99/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.3558</pub-id>
          <pub-id pub-id-type="medline">25896033</pub-id>
          <pub-id pub-id-type="pii">v17i4e99</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419194</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Commitment of newcomers and old-timers to online health support communities</article-title>
          <source>Proceedings of the SIGCHI Conference on Human Factors in Computing systems</source>
          <year>2017</year>
          <month>05</month>
          <conf-name>CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 6-11, 2017</conf-date>
          <conf-loc>Denver, CO</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>6363</fpage>
          <lpage>6375</lpage>
          <pub-id pub-id-type="doi">10.1145/3025453.3026008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mayfield</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Jurafsky</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Seekers, providers, welcomers, and storytellers: Modeling social roles in online health communities</article-title>
          <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source>
          <year>2019</year>
          <month>05</month>
          <conf-name>CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 4-9, 2019</conf-date>
          <conf-loc>Glasgow, Scotland, UK</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>1</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1145/3290605.3300574</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>Zheng</given-names>
            </name>
            <name name-style="western">
              <surname>Seering</surname>
              <given-names>Joseph</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>Robert</given-names>
            </name>
          </person-group>
          <article-title>The Channel Matters: Self-disclosure, reciprocity and social support in online cancer support groups</article-title>
          <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source>
          <year>2019</year>
          <month>05</month>
          <conf-name>CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 4-9, 2019</conf-date>
          <conf-loc>Glasgow, Scotland, UK</conf-loc>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1145/3290605.3300261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eschler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dehlawi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Self-characterized illness phase and information needs of participants in an online cancer forum</article-title>
          <source>Proceedings of the Ninth International AAAI Conference on Web and Social Media</source>
          <year>2015</year>
          <month>03</month>
          <day>01</day>
          <conf-name>Ninth International AAAI Conference on Web and Social Media</conf-name>
          <conf-date>May 26-29, 2015</conf-date>
          <conf-loc>University of Oxford, Oxford, UK</conf-loc>
          <publisher-loc>Palo Alto, CA</publisher-loc>
          <publisher-name>AAAI Press</publisher-name>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aaai.org/ocs/index.php/ICWSM/ICWSM15/paper/download/10546/10493"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y-C</given-names>
            </name>
            <name name-style="western">
              <surname>Robert</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>To stay or leave? The relationship of emotional and informational support to commitment in online health support groups</article-title>
          <source>Proceedings of the ACM 2012 conference on Computer Supported Cooperative Work</source>
          <year>2012</year>
          <month>02</month>
          <day>15</day>
          <conf-name>CSCW '12: Computer Supported Cooperative Work</conf-name>
          <conf-date>February 11-15, 2012</conf-date>
          <conf-loc>Seattle, WA</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>833</fpage>
          <lpage>842</lpage>
          <pub-id pub-id-type="doi">10.1145/2145204.2145329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yaden</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Kosinski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stillwell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Seligman</surname>
              <given-names>MEP</given-names>
            </name>
          </person-group>
          <article-title>Women are Warmer but No Less Assertive than Men: Gender and Language on Facebook</article-title>
          <source>PLoS One</source>
          <year>2016</year>
          <month>5</month>
          <day>25</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>e0155885</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0155885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0155885</pub-id>
          <pub-id pub-id-type="medline">27223607</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-49892</pub-id>
          <pub-id pub-id-type="pmcid">PMC4881750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Dziurzynski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ramones</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kosinski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stillwell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Seligman</surname>
              <given-names>MEP</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>Personality, gender, and age in the language of social media: the open-vocabulary approach</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <month>9</month>
          <day>25</day>
          <volume>8</volume>
          <issue>9</issue>
          <fpage>e73791</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0073791"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0073791</pub-id>
          <pub-id pub-id-type="medline">24086296</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-03858</pub-id>
          <pub-id pub-id-type="pmcid">PMC3783449</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pelullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polsky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volpp</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Studying expressions of loneliness in individuals using twitter: an observational study</article-title>
          <source>BMJ Open</source>
          <year>2019</year>
          <month>11</month>
          <day>04</day>
          <volume>9</volume>
          <issue>11</issue>
          <fpage>e030355</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=31685502"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2019-030355</pub-id>
          <pub-id pub-id-type="medline">31685502</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2019-030355</pub-id>
          <pub-id pub-id-type="pmcid">PMC6830671</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Studying How Individuals Who Express the Feeling of Loneliness in an Online Loneliness Forum Communicate in a Nonloneliness Forum: Observational Study</article-title>
          <source>JMIR Form Res</source>
          <year>2021</year>
          <month>07</month>
          <day>20</day>
          <volume>5</volume>
          <issue>7</issue>
          <fpage>e28738</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2021/7/e28738/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28738</pub-id>
          <pub-id pub-id-type="medline">34283026</pub-id>
          <pub-id pub-id-type="pii">v5i7e28738</pub-id>
          <pub-id pub-id-type="pmcid">PMC8335613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>AU</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Adusumalli</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Groeneveld</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Predicting Cardiovascular Risk Using Social Media Data: Performance Evaluation of Machine-Learning Models</article-title>
          <source>JMIR Cardio</source>
          <year>2021</year>
          <month>03</month>
          <day>19</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e24473</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cardio.jmir.org/2021/1/e24473/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24473</pub-id>
          <pub-id pub-id-type="medline">33605888</pub-id>
          <pub-id pub-id-type="pii">v5i1e24473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Munmun</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Mental health discourse on reddit: Self-disclosure, social support, and anonymity</article-title>
          <year>2014</year>
          <month>06</month>
          <day>01</day>
          <conf-name>Eighth International AAAI Conference on Weblogs and Social Media</conf-name>
          <conf-date>June 1-4, 2014</conf-date>
          <conf-loc>Ann Arbor, MI</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>MacLean</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lembke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Forum77: An analysis of an online health forum dedicated to addiction recovery</article-title>
          <source>Proceedings of the 18th ACM Conference on Computer Supported Cooperative Work &#38; Social Computing</source>
          <year>2015</year>
          <month>03</month>
          <day>14</day>
          <conf-name>CSCW '15: Computer Supported Cooperative Work and Social Computing</conf-name>
          <conf-date>March 14-18, 2015</conf-date>
          <conf-loc>Vancouver, BC, Canada</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>1511</fpage>
          <lpage>1526</lpage>
          <pub-id pub-id-type="doi">10.1145/2675133.2675146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Does Social Support (Expressed in Post Titles) Elicit Comments in Online Substance Use Recovery Forums?</article-title>
          <source>Proceedings of the Fourth Workshop on Natural Language Processing and Computational Social Science</source>
          <year>2020</year>
          <month>11</month>
          <day>20</day>
          <conf-name>Fourth Workshop on Natural Language Processing and Computational Social Science</conf-name>
          <conf-date>November 20, 2020</conf-date>
          <conf-loc>Virtual</conf-loc>
          <fpage>35</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.nlpcss-1.4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernandes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bernardino</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>What is BigQuery?</article-title>
          <source>IDEAS '15: Proceedings of the 19th International Database Engineering &#38; Applications Symposium</source>
          <year>2015</year>
          <month>07</month>
          <day>15</day>
          <conf-name>IDEAS '15: 19th International Database Engineering &#38; Applications Symposium</conf-name>
          <conf-date>July 13-15, 2015</conf-date>
          <conf-loc>Yokohama, Japan</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>202</fpage>
          <lpage>203</lpage>
          <pub-id pub-id-type="doi">10.1145/2790755.2790797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2003</year>
          <month>01</month>
          <day>01</day>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gelfand</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AFM</given-names>
            </name>
          </person-group>
          <article-title>Sampling-Based Approaches to Calculating Marginal Densities</article-title>
          <source>Journal of the American Statistical Association</source>
          <year>1990</year>
          <month>06</month>
          <volume>85</volume>
          <issue>410</issue>
          <fpage>398</fpage>
          <lpage>409</lpage>
          <pub-id pub-id-type="doi">10.1080/01621459.1990.10476213</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sap</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Dlatk: Differential language analysis toolkit</article-title>
          <source>Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</source>
          <year>2017</year>
          <month>09</month>
          <day>7</day>
          <conf-name>2017 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</conf-name>
          <conf-date>September 2017</conf-date>
          <conf-loc>Copenhagen, Denmark</conf-loc>
          <fpage>55</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/d17-2010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pennebaker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Blackburn</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>The Development and Psychometric Properties of LIWC2015</source>
          <year>2015</year>
          <month>09</month>
          <day>01</day>
          <access-date>2021-08-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://repositories.lib.utexas.edu/bitstream/handle/2152/31333/LIWC2015_LanguageManual.pdf">https://repositories.lib.utexas.edu/bitstream/handle/2152/31333/LIWC2015_LanguageManual.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ostendorf</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Characterizing the language of online communities and its relation to community reception (preprint)</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <month>02</month>
          <day>01</day>
          <volume>1</volume>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.18653/v1/d16-1108</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
