<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JC</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Cancer</journal-id>
      <journal-title>JMIR Cancer</journal-title>
      <issn pub-type="epub">2369-1999</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v4i2e11073</article-id>
    <article-id pub-id-type="pmid">30563821</article-id>
    <article-id pub-id-type="doi">10.2196/11073</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>How to Optimize Health Messages About Cancer on Facebook: Mixed-Methods Study</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Kulanthaivel</surname>
          <given-names>Anand</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Das</surname>
          <given-names>Enny</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes" equal-contrib="yes">
      <name name-style="western">
        <surname>Biancovilli</surname>
        <given-names>Priscila</given-names>
      </name>
      <degrees>MSc</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Doctoral School of Health Sciences</institution>
        <institution>University of Pécs</institution>
        <addr-line>Vörösmarty utca 4</addr-line>
        <addr-line>Pécs, 7621</addr-line>
        <country>Hungary</country>
        <phone>36 (72) 513 678</phone>
        <email>biancovilli@bioqmed.ufrj.br</email>
      </address>  
      <xref rid="aff2" ref-type="aff">2</xref>
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1425-4223</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Jurberg</surname>
          <given-names>Claudia</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3607-7299</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
    <label>1</label>
    <institution>Doctoral School of Health Sciences</institution>
    <institution>University of Pécs</institution>  
    <addr-line>Pécs</addr-line>
    <country>Hungary</country></aff>
    <aff id="aff2">
    <label>2</label>
    <institution>Laboratório de Imunologia Tumoral Dra. Ottilia Affonso Mitidieri</institution>
    <institution>Instituto de Bioquímica Médica Leopoldo de Meis</institution>  
    <institution>Universidade Federal do Rio de Janeiro</institution>  
    <addr-line>Rio de Janeiro</addr-line>
    <country>Brazil</country></aff>
    <aff id="aff3">
    <label>3</label>
    <institution>Fundação Oswaldo Cruz</institution>
    <institution>Instituto Oswaldo Cruz</institution>  
    <addr-line>Rio de Janeiro</addr-line>
    <country>Brazil</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Priscila Biancovilli 
      <email>biancovilli@bioqmed.ufrj.br</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Jul-Dec</season><year>2018</year></pub-date>
    <pub-date pub-type="epub">
      <day>18</day>
      <month>12</month>
      <year>2018</year>
    </pub-date>
    <volume>4</volume>
    <issue>2</issue>
    <elocation-id>e11073</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>21</day>
        <month>5</month>
        <year>2018</year>
      </date>
      <date date-type="rev-request">
        <day>9</day>
        <month>8</month>
        <year>2018</year>
      </date>
      <date date-type="rev-recd">
        <day>3</day>
        <month>10</month>
        <year>2018</year>
      </date>
      <date date-type="accepted">
        <day>30</day>
        <month>10</month>
        <year>2018</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Priscila Biancovilli, Claudia Jurberg. Originally published in JMIR Cancer (http://cancer.jmir.org), 18.12.2018.</copyright-statement>
    <copyright-year>2018</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cancer, is properly cited. The complete bibliographic information, a link to the original publication on http://cancer.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://cancer.jmir.org/2018/2/e11073/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Incidence rate of cancer is increasing worldwide, with longer life expectancy being one of the main causes. Yet, between 30% and 50% of cancer cases are preventable, and early detection contributes to a better prognosis. This makes health communication strategies essential. Facebook, the world’s most used social networking site in 2017 and 2018, can be a useful tool for disseminating powerful messages on health promotion, prevention, and early detection.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>We aimed to (1) offer ways of optimizing health messages about cancer on Facebook, focusing on topics, such as risk factors, prevention, treatment, early diagnosis, and cure, and (2) investigate which aspects of these messages generate greater engagement.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>To verify what generates greater engagement in topics related to cancer on Facebook, we analyzed 16 Brazilian pages with the main theme of cancer. We performed a manual analysis of texts, content, and engagement rates. Finally, we developed a software program to operationalize the analysis of Facebook posts. The tool we devised aims to automate the analysis of any Facebook page with cancer as the main theme.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>We analyzed 712 posts over a 1-month period. We divided the posts into the following 8 categories: “Testimonies or real-life stories,” “Solidarity,” “Anniversaries,” “Science and health,” “Events,” “Institutional,” “Risk factors,” and “Beauty.” The pages were also organized into groups according to the type of profile to which they belonged (ie, hospitals or foundations, informative, nongovernmental organizations, and personal pages). The results showed that the categories generating greater engagement in Brazil were not those with the highest percentage of cancer-related content. For instance, in the “Informative” group the “Testimonies or real-life stories” category generated an engagement of 79.5%. However, only 9.5% (25/261) of the content within the relevant time period dealt with such topics. Another example concerns the category “Science and health.” Despite being the one with the highest number of posts (129/261, 49.4%), it scored 5th in terms of engagement. This investigation served as the basis for the development of a tool designed to automate the analysis of Facebook pages. The list of categories and keywords generated by this analysis was employed to feed the system, which was then able to categorize posts appearing on a Facebook page. We tested the system on 163 posts and only 34 were classified incorrectly, which amounts to a 20.8% error rate (79.2% accuracy).</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>The analysis we conducted by categorizing posts and calculating engagement rates shows that the potential of Facebook pages is often underutilized. This occurs because the categories that generate the greatest engagement are often not those most frequently used. The software developed in this research may help administrators of cancer-related pages analyze their posts more easily and increase public interest as a result.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>cancer</kwd>
      <kwd>content analysis</kwd>
      <kwd>Facebook</kwd>
      <kwd>health</kwd>
      <kwd>software</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Cancer is an umbrella term encompassing a group of &#62;200 diseases that have in common the disordered growth of cells invading tissues and organs [<xref ref-type="bibr" rid="ref1">1</xref>]. The number of cancer-related deaths worldwide increased from 6 million in 2000 to 7.6 million in 2007 [<xref ref-type="bibr" rid="ref2">2</xref>]. In 2012, there were 8.2 million cancer-related deaths [<xref ref-type="bibr" rid="ref3">3</xref>], and in 2018, it is estimated that this disease will be responsible for around 9.6 million deaths. While about 1 in 6 deaths globally is due to cancer [<xref ref-type="bibr" rid="ref4">4</xref>], Brazil has an incidence rate of 205.5 cases of cancer per 100,000 inhabitants, thus ranking tenth in South America and the Caribbean region [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>For prevention purposes, it is important to reiterate that changes in lifestyle and habits of the population may reduce the likelihood of disease onset. As reported by Anand et al, “Only 5%-10% of all cancer cases can be attributed to genetic defects, whereas the remaining 90%-95% have their roots in the environment and lifestyle. The lifestyle factors include cigarette smoking, diet (fried foods, red meat), alcohol, sun exposure, environmental pollutants, infections, stress, obesity, and physical inactivity” [<xref ref-type="bibr" rid="ref5">5</xref>]. There is, thus, evidence that prevention is the most cost-effective, long-term strategy for controlling the onset of cancer [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>In addition to the importance of adopting a healthy lifestyle for prevention, it is crucial to increase early detection in individuals who already exhibit symptoms of the disease. Indeed, when some types of cancer are diagnosed in the early stages, the chances of treatment success and cure (for, at least, 5 years after diagnosis) increase dramatically. According to <italic>Cancer Research UK</italic>, some types of cancer can be treated much more easily if detected early, for example, bowel, breast, ovarian, and lung [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      </sec>
      <sec>
        <title>Facebook and Health Communication</title>
        <p>Facebook is currently the social networking site with the highest number of active users; in June 2017, it reached 2 billion monthly active users [<xref ref-type="bibr" rid="ref8">8</xref>]. Every minute, 510,000 comments are posted, 293,000 statuses are updated, and 136,000 photos are uploaded [<xref ref-type="bibr" rid="ref9">9</xref>]. The most common forms of interaction are reactions (eg, when a user clicks on one of the emojis representing emotions, such as love, surprise, sadness, and anger), comments (eg, when a user writes a text under a post), and shares (eg, when a user shares another person’s post on his or her Facebook profile). Brazil ranks third in the world per the number of Facebook users (130 million), following India (270 million) and the United States (210 million) [<xref ref-type="bibr" rid="ref10">10</xref>]. Several Facebook pages worldwide are devoted to health promotion. Here, we characterize a “Facebook page” as a public profile created by businesses, organizations, celebrities, or anyone seeking to promote themselves publicly through social media [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        <p>The active search for health information is associated with greater knowledge of health and with positive behavioral change; that is, individuals tend to become healthier when they are better informed [<xref ref-type="bibr" rid="ref12">12</xref>]. A number of studies have already explored health-related pages on Facebook to verify the effectiveness of this communication strategy [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. This body of research shows that there is a significant degree of user responsiveness to the topics posted on these pages, suggesting that there is still considerable room for growth in this type of discussion.</p>
      </sec>
      <sec>
        <title>Facebook and Cancer</title>
        <p>The use of Facebook as a platform for disseminating health messages focused on cancer treatment, early diagnosis, and prevention has been overlooked in the scientific literature. One of the few papers dealing with this theme [<xref ref-type="bibr" rid="ref16">16</xref>] analyzed about 13,000 comments posted by visiting users on 3 Brazilian cancer-related pages. It was observed that on these pages there was a strong presence of comments employing religious terms such as “God,” “faith,” “Lord,” “blessed,” “save,” and “pray.” Notably, most of the comments were written by women, and the content of the messages was found to be overwhelmingly positive.</p>
        <p>A related study conducted in the United States [<xref ref-type="bibr" rid="ref12">12</xref>] looked at the National Cancer Institute page to identify the most effective strategies for engaging the audience. The researchers reviewed the posts and comments made on this page and found that “audience engagement is associated with the format of cancer-related posts. Specifically, photo posts received significantly more reactions, comments and shares than videos, links, and status updates (posts that contain only texts)” [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>Another study published in 2017 [<xref ref-type="bibr" rid="ref17">17</xref>] implemented a Facebook-based intervention, the main goal of which was to induce users to reduce or stop smoking; the researchers concluded that the interaction between users led to a decrease in the number of cigarettes smoked per week. This result indicates that a Web-based environment of social support and engagement may be beneficial for participants’ health.</p>
        <p>Finally, another paper [<xref ref-type="bibr" rid="ref18">18</xref>] studied the Facebook platform to understand “the most commonly used terms and phrases relating to breast cancer screening and the most commonly shared website links that other women interacted with.” The study concluded that on this social media, women “shared and reacted to links to commercial and informative websites regarding breast cancer and screening”; this result may provide clues for the development of messaging strategies addressing the importance of early detection of breast cancer.</p>
        <p>Despite the studies mentioned above, little research is available on the best ways to engage the public in health communication on social media, both in Brazil and worldwide. Academic analyses are even scarcer with respect to cancer-related communication; this might have a negative impact on the Facebook pages of hospitals, nongovernmental organizations (NGOs), and informational organizations, which may end up reaching a lower percentage of the audience than their potential. Therefore, the objectives of this study were to offer ways of optimizing health messages about cancer on Facebook, with special emphasis on topics such as risk factors, prevention, treatment, early diagnosis, and cure, and to investigate which aspects of these messages generate greater engagement in the audience. Notably, the metric of engagement on Facebook is based on the number of reactions, shares, and comments for a post.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>This was a qualitative and quantitative study [<xref ref-type="bibr" rid="ref19">19</xref>] with a descriptive purpose [<xref ref-type="bibr" rid="ref20">20</xref>], not starting from an <italic>a priori</italic> hypothesis.</p>
      <sec>
        <title>Choosing and Organizing Facebook Data</title>
        <p>To verify what generates greater engagement in cancer-related topics on Facebook, we analyzed 16 Brazilian pages with the main theme of cancer. In 2017, we studied these pages 2 times over a 1-month period, from March 14 to April 14 and then from April 15 to May 15. With respect to the page selection for this study, we proceeded as follows:</p>
        <list list-type="order">
          <list-item>
            <p>We typed the word “cancer” in Facebook’s internal search engine (“câncer” in Portuguese) and selected the “Pages” option.</p>
          </list-item>
          <list-item>
            <p>We disregarded pages that were not written in Brazilian Portuguese. We also disregarded pages referring to “Cancer” as an astrological sign. To ensure that the pages were actually Brazilian, we also read the posts to attain better identification of the geographical origin of the page; this was done by either recognizing the way in which Portuguese was written (ie, by looking at the differences between European, African, or Brazilian Portuguese) or seeing that the authors themselves mentioned living in Brazil.</p>
          </list-item>
          <list-item>
            <p>To select the pages, we first considered those with a higher number of followers, and then we looked at the updates. Notably, to enter our survey, the page should have, at least, 2 weekly updates in the selected 4-week period. We ended up selecting 15 pages, which were divided into the following categories: personal pages, newsletters, hospitals or foundations, and NGOs.</p>
          </list-item>
          <list-item>
            <p>Finally, we analyzed a Facebook page created by us, the purpose of which was to inform the public about the prevention and early diagnosis of cancer. We called this page “Acubens, museu de cancer” (“Acubens, cancer museum” in English).</p>
          </list-item>
        </list>
        <p>It is worth noting that in our research, we did not select pages that specifically addressed prevention or early detection. Our intention was rather to identify how Brazilian Facebook pages dealt with cancer-related topics. We include the name of each page, the number of followers in 2017 and a content description in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>For our analysis, we used the social media monitoring tool Quintly (quintly.com) because it allows the monitoring of multiple media at the same time, even when a user is not an administrator of the relevant pages. Quintly organizes the publicly available information of all pages (ie, the number of followers, reactions, comments, and shares) in charts and tables, showing, for example, how many new followers a certain page has acquired, or the number of posts created in a selected time period. This service also provides a user with the complete listing of the posts for all the selected pages, collecting the data in a table that indicates the date, time, and type of post. The types of post are sorted into the following categories: photo (any image file), video, event (invitations to events, with the option to accept or decline), status (text-only posts), or link (posts including a Web address redirecting to an external page). These post type definitions mirror those offered by Facebook itself.</p>
      </sec>
      <sec>
        <title>Content Analysis of Posts and Engagement Rate</title>
        <p>The analysis of the posts was conducted following the methodology proposed by Bardin [<xref ref-type="bibr" rid="ref21">21</xref>], which consists of a type of inductive analysis [<xref ref-type="bibr" rid="ref22">22</xref>]. In our case, 2 researchers performed the analysis independently. We conducted the process of content analysis as follows:</p>
        <list list-type="order">
          <list-item>
            <p><italic>Preanalysis</italic>: It comprised careful and systematic reading of all the text in posts to identify the most relevant categories.</p>
          </list-item>
          <list-item>
            <p><italic>Categorization</italic>: It involved the creation of relevant categories so that all individual posts would fit into, at least, one. In this study, the 2 researchers created their categories independently and subsequently worked together to create a final list. In the case of discrepancy between the 2 initial lists, the 2 researchers discussed the categories concerned until consensus was reached.</p>
          </list-item>
          <list-item>
            <p><italic>Interpretation</italic>: It involved the study of the data and development of inferences [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
          </list-item>
        </list>
        <p>After the content analysis process, the 2 researchers created a list of keywords for each category. It was not possible for the same word to feature in more than one category. Moreover, very general words that could fit into any of the categories, such as “cancer” or “chemotherapy,” were not taken into consideration. After the 2 researchers created their lists independently, they met to check similarities and differences and finally a unique list based on consensus was created.</p>
        <p>To obtain a more holistic view of the categories, we also established the total impact that each would have, termed the “engagement rate.” This value considered 3 metrics for each page. We calculated the weighted average of reactions, shares, and comments for each post in the 16 relevant pages, assigning a weight of 0.05 for reactions, 0.2 for shares, and 0.75 for comments [<xref ref-type="bibr" rid="ref23">23</xref>]. The weights created for the calculation of the total engagement took into consideration that the type of engagement (ie, liking, commenting, or sharing) follows a hierarchy according to the amount of effort required by the user to undertake it. For instance, liking a post is usually considered low engagement because it is the simplest and quickest among the 3 available actions; sharing is rather considered a medium form of engagement because a Facebook user identifies with the content to the point that he or she wants to share it on his or her page. Finally, we regard commenting as a high form of engagement; in this case, a Facebook user needs to reflect on the topic in question, draft text, and state his or her opinion publicly.</p>
      </sec>
      <sec>
        <title>Elaboration of a System That Automates the Analysis</title>
        <p>Our previous analysis of Facebook pages [<xref ref-type="bibr" rid="ref23">23</xref>], as well as this study, served as the basis for the development of a tool designed to automate the analysis of any cancer-related Facebook page.</p>
        <p>The tool developed constitutes a software program created in JavaScript that allows users to organize different types of Facebook posts according to metrics. While some of these metrics are publicly available (eg, reactions, shares, and comments), others are only accessible by page administrators. The metrics employed by our software are as follows: post reach (how many people viewed that post); post clicks (how many users clicked to read the full text); post hides (how many people hid the page content after reading the post, or reported the page as spam); reactions; shares; comments; engagement (weighted average engagement = number of clicks + reactions × 0.05 + shares × 0.2 + comments × 0.75); and engagement rate (engagement divided by reach). The software then enables the creation of a ranking according to each of these metrics. The ranking can be created by considering all the posts published in a relevant period or by filtering according to the categories to be analyzed.</p>
        <p>Moreover, within the software, we created a database of categories and a dictionary of keywords, which were developed by the researchers in an earlier phase of this work; this list is editable, and categories or words may be added or removed at any time. Notably, our system can only “read” complete words, and it does not consider compound or root words. This means that the keywords list contains all the possible variations of a particular word—singular, plural, masculine, and feminine. From these data, the system is then able to tag posts and fit them into categories. If a post uses keywords belonging to more than one category, the system will fit the post into the category exhibiting the highest number of keywords.</p>
        <p>Our software is also able to predict the engagement rate that a post would have based on the engagement rates of the previous posts on a given page. More specifically, if a text features keywords that have generated high engagement in previous posts, the likelihood of this new post also having high engagement increases.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Content Analysis of Facebook Pages</title>
        <p>The 16 Facebook pages that we analyzed produced a total of 712 posts in the relevant 1-month period. As mentioned above, all the pages were organized in groups according to the profile to which they belonged (ie, hospitals or foundations, informative, NGOs and personal pages).</p>
        <p>In our previous study [<xref ref-type="bibr" rid="ref23">23</xref>], we analyzed the texts of 3 Brazilian pages about cancer over a 6-month period (January-June, 2014) and created 8 categories as follows: “Testimonies or real-life stories” (people writing about their experience of cancer or any real-life story); “Solidarity” (posts asking people to make a donation, such as blood or hair); “Anniversaries” (when the main subject of the post was the celebration of some important date); “Science and health” (posts about scientific discoveries, academic research, and progress in treatment); “Events” (when the page administrator organized or publicized some event); “Institutional” (when an institution wrote about itself); “Risk factors” (when the posts addressed habits increasing the risk of cancer, such as smoking); and “Beauty” (posts about makeup, clothes, or hairstyles).</p>
        <p>Although we added new pages in this later analysis, we did not have to create new categories with respect to those listed above, indicating that despite the authors and page administrators being different, the spectrum of topics within the theme of cancer remained similar.</p>
        <p>The results presented in <xref ref-type="table" rid="table1">Table 1</xref> show the analysis of the page performance divided into the following groups: hospitals or foundations, informative pages, NGOs, and personal pages.</p>
        </sec>
      <sec>
        <title>Facebook Analytics Software Development</title>
        <p>The software we developed for the content analysis of Facebook posts and their classification into categories has a simple and intuitive interface, illustrated in the following <xref ref-type="fig" rid="figure1">Figures 1</xref>-<xref ref-type="fig" rid="figure3">3</xref>. In <xref ref-type="fig" rid="figure2">Figure 2</xref>, darker squares indicate greater engagement, and in <xref ref-type="fig" rid="figure3">Figure 3</xref>, a bigger font indicates higher frequency.</p>
        <p>Initially, we entered in the software the 8 categories we created, as well as the keywords corresponding to each of these categories. Then, we tested the software through analysis of the page “Acubens, cancer museum,” which was created over the course of 6 months by our research group on the <italic>Oncobiology Program</italic> at the Federal University of Rio de Janeiro. Our goal was to verify whether the tool could actually tag the posts in the correct categories. Over this time period, the page presented 163 published posts. In the first stage of this investigation, 2 researchers categorized all posts manually. Then, the results of the manual classification were compared with that performed automatically by the software. This way, the researchers could verify whether the tool could correctly categorize the posts. Of 163 posts, only 34 were classified in the wrong categories by the tool. This corresponds to an error rate of 20.8% (or 79.2% accuracy). <xref ref-type="table" rid="table2">Table 2</xref> summarizes the results of the automated analysis performed by the software and the number of errors found for each category. The errors are derived from the comparison between the manual analysis done by the researchers and that performed by the software.</p>
        <p>The percentage of errors is considered acceptable. Indeed, according to the literature [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref28">28</xref>], the accuracy of multiclass text classification (when texts are classified into ≥3 categories) ranges from 46.9% to 83%.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Averages of reactions, shares, and comments and weighted average engagement of the 16 pages.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="250"/>
            <col width="100"/>
            <col width="140"/>
            <col width="120"/>
            <col width="140"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Group</td>
                <td>Post, n (%)</td>
                <td>Reactions, mean</td>
                <td>Shares, mean</td>
                <td>Comments, mean</td>
                <td>Weighted average engagement</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7"><bold>Hospitals or foundations (n=109)</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Solidarity</td>
                <td>11 (10)</td>
                <td>524</td>
                <td>346.9</td>
                <td>21.4</td>
                <td>111.6</td>
              </tr>
              <tr valign="bottom">
                <td><break/></td>
                <td>Anniversaries</td>
                <td>0 (0)</td>
                <td>N/A<sup>a</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Institutional</td>
                <td>57 (52.2)</td>
                <td>825.1</td>
                <td>161.3</td>
                <td>56.4</td>
                <td>115.8</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Testimonies or real-life stories</td>
                <td>2 (1.8)</td>
                <td>179</td>
                <td>26.5</td>
                <td>3</td>
                <td>16.4</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Science and health</td>
                <td>20 (18.3)</td>
                <td>1263.3</td>
                <td>440.5</td>
                <td>47</td>
                <td>186.5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Events</td>
                <td>18 (16.5)</td>
                <td>283.7</td>
                <td>52.5</td>
                <td>13.8</td>
                <td>35.1</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Beauty</td>
                <td>0 (0)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Risk factors</td>
                <td>1 (0.9)</td>
                <td>219</td>
                <td>57</td>
                <td>12</td>
                <td>31.3</td>
              </tr>
              <tr valign="top">
                <td colspan="7"><bold>Informative pages (n=261)</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Solidarity</td>
                <td>19 (7.3)</td>
                <td>1400.7</td>
                <td>227.9</td>
                <td>43</td>
                <td>147.9</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Anniversaries</td>
                <td>29 (11.1)</td>
                <td>2209.9</td>
                <td>717.4</td>
                <td>27</td>
                <td>274.2</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Institutional</td>
                <td>26 (9.9)</td>
                <td>397.3</td>
                <td>72.8</td>
                <td>5.7</td>
                <td>38.7</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Testimonies or real-life stories</td>
                <td>25 (9.6)</td>
                <td>1976.5</td>
                <td>79.9</td>
                <td>108.8</td>
                <td>196.4</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Science and health</td>
                <td>129 (49.4)</td>
                <td>143.4</td>
                <td>50.7</td>
                <td>3.8</td>
                <td>20.1</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Events</td>
                <td>28 (10.7)</td>
                <td>114.8</td>
                <td>28.4</td>
                <td>30.4</td>
                <td>34.2</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Beauty</td>
                <td>1 (0.3)</td>
                <td>85</td>
                <td>19</td>
                <td>3</td>
                <td>10.3</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Risk factors</td>
                <td>4 (1.5)</td>
                <td>76.2</td>
                <td>26.5</td>
                <td>2.2</td>
                <td>10.8</td>
              </tr>
              <tr valign="top">
                <td colspan="7"><bold>Nongovernmental organizations (n=156)</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Solidarity</td>
                <td>76 (48.7)</td>
                <td>559.8</td>
                <td>24.3</td>
                <td>16.2</td>
                <td>45.0</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Anniversaries</td>
                <td>8 (5.1)</td>
                <td>1641</td>
                <td>108.3</td>
                <td>33.8</td>
                <td>129.1</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Institutional</td>
                <td>27 (17.3)</td>
                <td>620.6</td>
                <td>37.8</td>
                <td>15.7</td>
                <td>50.4</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Testimonies or real-life stories</td>
                <td>11 (7.1)</td>
                <td>505.8</td>
                <td>24.5</td>
                <td>11.3</td>
                <td>38.7</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Science and health</td>
                <td>0 (0)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Events</td>
                <td>33 (21.1)</td>
                <td>305.3</td>
                <td>84.2</td>
                <td>18</td>
                <td>45.6</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Beauty</td>
                <td>1 (0.6)</td>
                <td>124</td>
                <td>0</td>
                <td>4</td>
                <td>9.2</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Risk factors</td>
                <td>0 (0)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              
              <tr valign="top">
                <td colspan="7"><bold>Personal pages (n=186)</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Solidarity</td>
                <td>53 (28.5)</td>
                <td>1885.2</td>
                <td>32.8</td>
                <td>48.9</td>
                <td>135.5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Anniversaries</td>
                <td>9 (4.3)</td>
                <td>1320.7</td>
                <td>10.8</td>
                <td>29.7</td>
                <td>90.5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Institutional</td>
                <td>26 (13.9)</td>
                <td>340.2</td>
                <td>8.7</td>
                <td>7.4</td>
                <td>24.3</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Testimonies or real-life stories</td>
                <td>68 (36.6)</td>
                <td>236.6</td>
                <td>18.4</td>
                <td>26.7</td>
                <td>35.6</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Science and health</td>
                <td>0 (0)</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Events</td>
                <td>10 (5.3)</td>
                <td>401.6</td>
                <td>8.8</td>
                <td>11.6</td>
                <td>30.5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Beauty</td>
                <td>19 (10.2)</td>
                <td>149.7</td>
                <td>8.3</td>
                <td>5.9</td>
                <td>16.6</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Risk factors</td>
                <td>1 (0.5)</td>
                <td>20</td>
                <td>1</td>
                <td>2</td>
                <td>2.7</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Screenshot of the “posts” tab, displaying the complete list of page posts. (Source: Created by Corbata Informática, 2016).</p>
          </caption>
          <graphic xlink:href="cancer_v4i2e11073_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Screenshot of the “Heat map” tab, displaying the days and times of higher engagement on a particular page. (Source: Created by Corbata Informática, 2016).</p>
          </caption>
          <graphic xlink:href="cancer_v4i2e11073_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Screenshot of the “Word cloud” tab, showing the words used more frequently on a given page. (Source: Created by Corbata Informática, 2016).</p>
          </caption>
          <graphic xlink:href="cancer_v4i2e11073_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Results of the automated analysis of the page “Acubens, cancer museum” and the number of errors compared with the manual analysis.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="550"/>
            <col width="250"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Category</td>
                <td>Posts analyzed by the tool, n (%)</td>
                <td>Errors per category, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Beauty</td>
                <td>1 (0.6)</td>
                <td>1 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>Science and health</td>
                <td>95 (57.2)</td>
                <td>4 (11.7)</td>
              </tr>
              <tr valign="top">
                <td>Anniversaries</td>
                <td>17 (10.2)</td>
                <td>10 (29.4)</td>
              </tr>
              <tr valign="top">
                <td>Testimonials</td>
                <td>25 (15)</td>
                <td>14 (41.1)</td>
              </tr>
              <tr valign="top">
                <td>Events</td>
                <td>1 (0.6)</td>
                <td>1 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>Risk factors</td>
                <td>11 (6.6)</td>
                <td>1 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>Institutional</td>
                <td>6 (3.6)</td>
                <td>1 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>Solidarity</td>
                <td>10 (6.0)</td>
                <td>2 (5.8)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Content Analysis of Facebook Pages</title>
        <p>In this study, we observed that the categories that generated the greater level of engagement were not those with the highest percentage of posts. For example, in the “Informative pages” group, the “Testimonies or real-life stories” category generated an engagement of 196.4. However, only 9.6% (25/261) of the page content in the period of analysis dealt with such topics. The category with the highest number of posts in the “Informative” group was “Science and health” (129/261, 49.4%); yet, this category was ranked only 6th with respect to engagement.</p>
        <p>We observed a similar pattern in the “NGOs” group. While the category generating the greatest engagement was “Anniversaries” (129.1), only 5.1% (8/156) of the page content fell into this category. Within this group of pages, the most frequent category was “Solidarity,” with 48.7% (76/156) of posts. However, the average engagement rate for these posts was 45, around 2.8 times lower than the most successful category and scoring fourth in the average engagement ranking.</p>
        <p>Another category with a relatively low presence among the analyzed posts was “Science and health”; this category, along with “Risk factors,” is directly related to topics such as cancer prevention, well-being, and early diagnosis. In the “NGOs” group and on personal pages, nothing was published on the subject. However, in the “Hospital or foundation” group, this category ranked first in terms of average engagement, indicating that people looking for information on hospitals and foundations are more likely to be interested in these topics than people visiting other cancer-related pages. Hence, we suggest that the administrators of hospitals or foundations devote more space to this subject on their Facebook pages.</p>
        <p>Furthermore, to increase engagement, it is crucial that the page administrators adopt strategies to incentivize their users to comment more often, as this is the type of participation that demands greater intellectual effort. Given that users who comment invest more time in a post, this is probably the reason why the average number of comments is lower than the average number of shares and reactions across all categories.</p>
        <p>Some of the most common strategies used to generate more comments on Facebook consist of asking users questions and responding to all the comments [<xref ref-type="bibr" rid="ref29">29</xref>]. As Porto emphasized, “The more a user interacts with a particular content producer, the greater the chances of that producer appearing in the user’s news feed” [<xref ref-type="bibr" rid="ref30">30</xref>]. To increase user engagement, it is, therefore, crucial for the page to encourage similar actions.</p>
      </sec>
      <sec>
        <title>Facebook Analytics Software Development</title>
        <p>The category “Science and health” had the largest number of posts (n=95), but it was also the one for which the software committed a small number of errors—only 4. Although the software cannot draw on images or videos that come with the publication, textual analysis proved sufficient for our purposes. In the “Risk factors” category, there was only one error out of 11 posts. An example of text that was correctly classified in the “Science and health” category is as follows:</p>
        <disp-quote>
          <p>Cancer can be fought with cell transplantation from healthy subjects. Scientists have discovered that it is possible to fight cancerous tumors by using cells from the immune system of a healthy person and transplanting them in the body of a person with the disease. The research was conducted by the Cancer Institute of the Netherlands and the University of Oslo in Norway and published last week by the journal Science. The researchers noted that by inserting components of a healthy donor's immune system cells into the cells of a patient with cancer in the laboratory, it is possible to get the patient’s body to recognize the tumors and attack them. The research was conducted on 3 patients with melanoma, a type of skin cancer. Read more:http://goo.gl/FgJNvv.</p>
          <attrib>Translated from Portuguese</attrib>
        </disp-quote>
        <p>Although the text contains words belonging to other categories, such as “donor” (“Solidarity”), the software was able to classify the post in the appropriate category, given that most of the words in this section concern “Science and health.”</p>
        <p>The classification errors made by the software occurred largely because the tool was not able to analyze the context surrounding a sentence. For instance, the following post was interpreted as “Anniversaries,” despite having been classified as “Institutional” by the researchers:</p>
        <disp-quote>
          <p>Any day is a day to break a taboo. Let's talk about cancer. Today's message was recorded with Manoel Gomes and he suggests we see the world in a more positive way. Watch the video by clicking on the link below [link] Get to know @Toda Poesia at [link].</p>
          <attrib>Translated from Portuguese</attrib>
        </disp-quote>
        <p>The mistake arguably happened because the word “day” appears 2 times and it is the only word in this post that also appeared in the keyword list. After this error, we may consider including the word “project” in the “Institutional” category as several publications from “Acubens, cancer museum” in this category contain this word.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>With respect to content analysis, one of the limitations concerned the fact that we restricted the study to pages produced in Brazilian Portuguese. We did this out of interest in gaining a better understanding of what is produced on social media about cancer in Brazil and what generates engagement among Brazilians. However, future studies should analyze more broadly the content generated in other countries and languages.</p>
        <p>With respect to the software, one limitation concerned the difficulty in choosing the words for each category, as some of them could belong to more than one. In many cases, we had to make choices based on the evaluative criteria of the researchers. However, it may very well be that people with different experiences and writing styles could have classified words in other categories. Another limitation, already mentioned above, may be that the software does not understand the context and, therefore, is unable to capture irony, jokes, ambiguous wording, or figurative language. Moreover, the system is not able to recognize common typing errors.</p>
        <p>Despite these limitations, our software could be of help to many research groups and Facebook page administrators wishing to gain a better understanding of what their audience wants and what generates engagement. Other features of the software, such as the “Heat map,” will also be of great value in this process.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Categorizing posts and calculating engagement rates revealed that the potential of Facebook pages is often underutilized. This may be because the categories generating the greatest engagement are not those used most frequently. In fact, we have noticed that in some cases, the most attractive category in terms of engagement is among the least published. For instance, it is worth noting that many pages had only a few posts in the “Science and health” category, despite this being one of the most popular. Indeed, along with “Risk factors,” “Science and health” is among the most relevant categories for public health issues, such as cancer prevention, early diagnosis, and well-being. Given that a high number of cancer cases are related to environmental and lifestyle issues, it is crucial to talk more about prevention and risky behaviors on social media.</p>
        <p>However, this study shows that personal pages and the “NGOs” group did not produce any messages about “Science and health.” The “NGOs” group also failed to produce any content on “Risk factors.” Our results suggest that NGOs should include more information about science, health, and risk factors and also set out to promote them more vigorously.</p>
        <p>Within the “Hospital or foundation” group, the category “Science and health” was the one that generated the highest weighted average engagement. However, only 18.3% (20/109) of the posts within this group of pages fell into this category. Our suggestion is that page administrators of hospitals or foundations give more space to this subject.</p>
        <p>The software developed in this study may certainly help research groups interested in studying cancer-related topics. In addition, the keyword dictionary on cancer could help people who are interested in delving deeper into this topic. Moreover, researchers and groups willing to create new categories and dictionaries could take advantage of our tool to gain a better understanding of what type of content engenders greater engagement among target audiences, thereby collecting information to produce more attractive Web-based content.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Name of each page, number of followers in 2017 and content description.</p>
        <media xlink:href="cancer_v4i2e11073_app1.pdf" xlink:title="PDF File (Adobe PDF File), 39KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">NGO</term>
          <def>
            <p>nongovernmental organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    
    <ack><p>This study was supported by the (Brazilian) National Council for Scientific and Technological Development, the Brazilian Cancer Foundation, and Carlos Chagas Filho Foundation (Fundação Carlos Chagas Filho de Amparo à Pesquisa do Estado do Rio de Janeiro).</p></ack>
    
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Sociedade Brasileira de Cirurgia Oncológica</collab>
        </person-group>
        <source>Comunidade: O que é câncer?</source>  
        <year>2015</year>  
        <access-date>2018-09-16</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.sbco.org.br/comunidade/o-que-e-cancer/">http://www.sbco.org.br/comunidade/o-que-e-cancer/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="74RkFvmYW"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>International Agency for Research on Cancer</collab>
        </person-group>
        <source>Global Cancer Observatory</source>  
        <year>2014</year>  
        <access-date>2018-09-16</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://gco.iarc.fr/">http://gco.iarc.fr/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72TZuFKTh"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Barbosa</surname>
            <given-names>IR</given-names>
          </name>
          <name name-style="western">
            <surname>de Souza</surname>
            <given-names>Dyego LB</given-names>
          </name>
          <name name-style="western">
            <surname>Bernal</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>do CC Costa</surname>
            <given-names>Íris</given-names>
          </name>
        </person-group>
        <article-title>Cancer mortality in Brazil: Temporal Trends and Predictions for the Year 2030</article-title>
        <source>Medicine (Baltimore)</source>  
        <year>2015</year>  
        <month>04</month>  
        <volume>94</volume>  
        <issue>16</issue>  
        <fpage>e746</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://Insights.ovid.com/pubmed?pmid=25906105"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1097/MD.0000000000000746</pub-id>
        <pub-id pub-id-type="medline">25906105</pub-id>
        <pub-id pub-id-type="pii">00005792-201504040-00016</pub-id>
        <pub-id pub-id-type="pmcid">PMC4602680</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
        <source>World Health Organization Cancer Factsheet</source>  
        <year>2017</year>  
        <access-date>2018-09-16</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.who.int/en/news-room/fact-sheets/detail/cancer">http://www.who.int/en/news-room/fact-sheets/detail/cancer</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72TaBDHGQ"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Anand</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Kunnumakkara</surname>
            <given-names>AB</given-names>
          </name>
          <name name-style="western">
            <surname>Kunnumakara</surname>
            <given-names>AB</given-names>
          </name>
          <name name-style="western">
            <surname>Sundaram</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Harikumar</surname>
            <given-names>KB</given-names>
          </name>
          <name name-style="western">
            <surname>Tharakan</surname>
            <given-names>ST</given-names>
          </name>
          <name name-style="western">
            <surname>Lai</surname>
            <given-names>OS</given-names>
          </name>
          <name name-style="western">
            <surname>Sung</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Aggarwal</surname>
            <given-names>BB</given-names>
          </name>
        </person-group>
        <article-title>Cancer is a preventable disease that requires major lifestyle changes</article-title>
        <source>Pharm Res</source>  
        <year>2008</year>  
        <month>09</month>  
        <volume>25</volume>  
        <issue>9</issue>  
        <fpage>2097</fpage>  
        <lpage>116</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18626751"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s11095-008-9661-9</pub-id>
        <pub-id pub-id-type="medline">18626751</pub-id>
        <pub-id pub-id-type="pmcid">PMC2515569</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cross</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <source>50 percent of cancer cases preventable</source>  
        <year>2017</year>  
        <access-date>2018-09-16</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancertutor.com/who-cancer-prevention/">https://www.cancertutor.com/who-cancer-prevention/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72TaIoERu"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Cancer Research UK</collab>
        </person-group>
        <source>Why is early diagnosis important?</source>  
        <year>2015</year>  
        <access-date>2018-09-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancerresearchuk.org/about-cancer/cancer-symptoms/why-is-early-diagnosis-important">https://www.cancerresearchuk.org/about-cancer/cancer-symptoms/why-is-early-diagnosis-important</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72Un9cKWX"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chaykowski</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <source>Mark Zuckerberg: 2 Billion Users Means Facebook's 'Responsibility Is Expanding'</source>  
        <year>2017</year>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.forbes.com/sites/kathleenchaykowski/2017/06/27/facebook-officially-hits-2-billion-users/#c5acc9437080">https://www.forbes.com/sites/kathleenchaykowski/2017/06/27/facebook-officially-hits-2-billion-users/#c5acc9437080</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72UnVvL4Q"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
        <source>The top 20 valuable Facebook statistics</source>  
        <year>2018</year>  
        <access-date>2018-09-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://zephoria.com/top-15-valuable-facebook-statistics/">https://zephoria.com/top-15-valuable-facebook-statistics/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72UnauVnB"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
        <source>Leading countries based on number of Facebook users as of July (in millions)</source>  
        <year>2018</year>  
        <access-date>2018-11-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.statista.com/statistics/268136/top-15-countries-based-on-number-of-facebook-users/">http://www.statista.com/statistics/268136/top-15-countries-based-on-number-of-facebook-users/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72UnqcSoz"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
        <source>What is a Facebook page?</source>  
        <year>2018</year>  
        <access-date>2018-09-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.techopedia.com/definition/15441/facebook-page">https://www.techopedia.com/definition/15441/facebook-page</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72Uodx1GP"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Strekalova</surname>
            <given-names>YA</given-names>
          </name>
          <name name-style="western">
            <surname>Krieger</surname>
            <given-names>JL</given-names>
          </name>
        </person-group>
        <article-title>A Picture Really is Worth a Thousand Words: Public Engagement with the National Cancer Institute on Social Media</article-title>
        <source>J Cancer Educ</source>  
        <year>2017</year>  
        <month>03</month>  
        <volume>32</volume>  
        <issue>1</issue>  
        <fpage>155</fpage>  
        <lpage>157</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26351003"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s13187-015-0901-5</pub-id>
        <pub-id pub-id-type="medline">26351003</pub-id>
        <pub-id pub-id-type="pii">10.1007/s13187-015-0901-5</pub-id>
        <pub-id pub-id-type="pmcid">PMC5030178</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Greene</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Choudhry</surname>
            <given-names>NK</given-names>
          </name>
          <name name-style="western">
            <surname>Kilabuk</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Shrank</surname>
            <given-names>WH</given-names>
          </name>
        </person-group>
        <article-title>Online social networking by patients with diabetes: a qualitative evaluation of communication with Facebook</article-title>
        <source>J Gen Intern Med</source>  
        <year>2011</year>  
        <month>03</month>  
        <volume>26</volume>  
        <issue>3</issue>  
        <fpage>287</fpage>  
        <lpage>292</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20945113"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s11606-010-1526-3</pub-id>
        <pub-id pub-id-type="medline">20945113</pub-id>
        <pub-id pub-id-type="pmcid">PMC3043192</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Naslund</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Aschbrenner</surname>
            <given-names>KA</given-names>
          </name>
          <name name-style="western">
            <surname>Marsch</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Bartels</surname>
            <given-names>SJ</given-names>
          </name>
        </person-group>
        <article-title>Feasibility and acceptability of Facebook for health promotion among people with serious mental illness</article-title>
        <source>Digit Health</source>  
        <year>2016</year>  
        <month>11</month>  
        <day>01</day>  
        <volume>2</volume>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28367321"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/2055207616654822</pub-id>
        <pub-id pub-id-type="medline">28367321</pub-id>
        <pub-id pub-id-type="pmcid">PMC5370548</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Khawaja</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>KI</given-names>
          </name>
          <name name-style="western">
            <surname>Khan</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Using Facebook for Sexual Health Social Marketing in Conservative Asian Countries: A Systematic Examination</article-title>
        <source>J Health Commun</source>  
        <year>2017</year>  
        <month>02</month>  
        <volume>22</volume>  
        <issue>2</issue>  
        <fpage>111</fpage>  
        <lpage>123</lpage>  
        <pub-id pub-id-type="doi">10.1080/10810730.2016.1222031</pub-id>
        <pub-id pub-id-type="medline">28103152</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Picanço</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Biancovilli</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Jurberg</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Beyond the Drama: the Beautiful Life in News Feeds on Cancer</article-title>
        <source>J Cancer Educ</source>  
        <year>2018</year>  
        <month>04</month>  
        <volume>33</volume>  
        <issue>2</issue>  
        <fpage>424</fpage>  
        <lpage>428</lpage>  
        <pub-id pub-id-type="doi">10.1007/s13187-016-1094-2</pub-id>
        <pub-id pub-id-type="medline">27501961</pub-id>
        <pub-id pub-id-type="pii">10.1007/s13187-016-1094-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>SJ</given-names>
          </name>
          <name name-style="western">
            <surname>Marsch</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Brunette</surname>
            <given-names>MF</given-names>
          </name>
          <name name-style="western">
            <surname>Dallery</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Harnessing Facebook for Smoking Reduction and Cessation Interventions: Facebook User Engagement and Social Support Predict Smoking Reduction</article-title>
        <source>J Med Internet Res</source>  
        <year>2017</year>  
        <month>05</month>  
        <day>23</day>  
        <volume>19</volume>  
        <issue>5</issue>  
        <fpage>e168</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2017/5/e168/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.6681</pub-id>
        <pub-id pub-id-type="medline">28536096</pub-id>
        <pub-id pub-id-type="pii">v19i5e168</pub-id>
        <pub-id pub-id-type="pmcid">PMC5461420</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Huesch</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Chetlen</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Segel</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Schetter</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Frequencies of Private Mentions and Sharing of Mammography and Breast Cancer Terms on Facebook: A Pilot Study</article-title>
        <source>J Med Internet Res</source>  
        <year>2017</year>  
        <month>06</month>  
        <day>09</day>  
        <volume>19</volume>  
        <issue>6</issue>  
        <fpage>e201</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2017/6/e201/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.7508</pub-id>
        <pub-id pub-id-type="medline">28600279</pub-id>
        <pub-id pub-id-type="pii">v19i6e201</pub-id>
        <pub-id pub-id-type="pmcid">PMC5482928</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Minayo</surname>
            <given-names>MC</given-names>
          </name>
          <name name-style="western">
            <surname>Minayo-Gomez</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Difíceis e possíveis relações entre métodos quantitativos e qualitativos nos estudos de problemas de saúde</article-title>
        <source>Goldenberg P, Marsiglia RMG, Gomes MHA, editors. O clássico e o novo: tendências, objetos e abordagens em ciências sociais e saúde</source>  
        <year>2003</year>  
        <publisher-loc>Rio de Janeiro</publisher-loc>
        <publisher-name>Fiocruz</publisher-name>
        <fpage>117</fpage>  
        <lpage>142</lpage> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jackson</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>Research Methods And Statistics</source>  
        <year>2018</year>  
        <publisher-loc>Boston</publisher-loc>
        <publisher-name>Cengage Learning</publisher-name></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bardin</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <source>Análise de Conteúdo</source>  
        <year>2011</year>  
        <publisher-loc>São Paulo</publisher-loc>
        <publisher-name>Edições 70</publisher-name></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Elo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kyngäs</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>The qualitative content analysis process</article-title>
        <source>J Adv Nurs</source>  
        <year>2008</year>  
        <month>04</month>  
        <volume>62</volume>  
        <issue>1</issue>  
        <fpage>107</fpage>  
        <lpage>115</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1365-2648.2007.04569.x</pub-id>
        <pub-id pub-id-type="medline">18352969</pub-id>
        <pub-id pub-id-type="pii">JAN4569</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Biancovilli</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Picanço</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Jurberg</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>To read or not to read? Identifying communication patterns in three cancer-related Facebook pages</article-title>
        <source>Cogent Social Sciences</source>  
        <year>2017</year>  
        <month>05</month>  
        <day>24</day>  
        <volume>3</volume>  
        <issue>1</issue>  
        <pub-id pub-id-type="doi">10.1080/23311886.2017.1331816</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pang</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Seeing stars: exploiting class relationships for sentiment categorization with respect to rating scales</article-title>
        <year>2005</year>  
        <conf-name>Proceedings of the 43rd Annual Meeting on Association for Computational Linguistics (ACL'05)</conf-name>
        <conf-date>June 2005</conf-date>
        <conf-loc>University of Michigan</conf-loc>
        <fpage>115</fpage>  
        <lpage>124</lpage>  
        <pub-id pub-id-type="doi">10.3115/1219840.1219855</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Qu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ifrim</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Weikum</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>The bag-of-opinions method for review rating prediction from sparse text patterns</article-title>
        <year>2010</year>  
        <conf-name>Proceedings of the 23rd International Conference on Computational Linguistics</conf-name>
        <conf-date>August 23 - 27, 2010</conf-date>
        <conf-loc>Beijing</conf-loc>
        <fpage>913</fpage>  
        <lpage>921</lpage> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Long</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>X</given-names>
          </name>
        </person-group>
        <article-title>A review selection approach for accurate feature rating estimation</article-title>
        <year>2010</year>  
        <conf-name>Proceedings of the 23rd International Conference on Computational Linguistics: Posters</conf-name>
        <conf-date>August 23 - 27, 2010</conf-date>
        <conf-loc>Beijing</conf-loc>
        <fpage>766</fpage>  
        <lpage>774</lpage> </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paltoglou</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Thelwall</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Seeing Stars of Valence and Arousal in Blog Posts</article-title>
        <source>IEEE Trans Affective Comput</source>  
        <year>2013</year>  
        <month>01</month>  
        <volume>4</volume>  
        <issue>1</issue>  
        <fpage>116</fpage>  
        <lpage>123</lpage>  
        <pub-id pub-id-type="doi">10.1109/T-AFFC.2012.36</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lunardi</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Viterbo</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Bernardini</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Análise de sentimentos utilizando técnicas de classificação multiclasse</article-title>
        <source>Tópicos em Sistemas de Informação: Minicursos SBSI</source>  
        <year>2016</year>  
        <publisher-loc>Florianópolis</publisher-loc>
        <publisher-name>UFSC Departamento de Informática e Estatística</publisher-name>
        <fpage>1</fpage>  
        <lpage>30</lpage> </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ayres</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>Who else wants to get more comments on your Facebook posts?</source>  
        <year>2015</year>  
        <access-date>2018-09-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.postplanner.com/get-more-comments-on-facebook-posts/">https://www.postplanner.com/get-more-comments-on-facebook-posts/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72UpDDfj5"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Porto</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <source>O Edgerank nunca existiu? Saiba que muda no seu Feed de Notícias</source>  
        <year>2013</year>  
        <access-date>2018-09-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.camilaporto.com.br/facebook/o-edgerank-nunca-existiu-saiba-que-muda-no-seu-feed-de-noticias">https://www.camilaporto.com.br/facebook/o-edgerank-nunca-existiu-saiba-que-muda-no-seu-feed-de-noticias</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="72UpUttoW"/>
        </comment> </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
