<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JC</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Cancer</journal-id>
      <journal-title>JMIR Cancer</journal-title>
      <issn pub-type="epub">2369-1999</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i3e39003</article-id>
      <article-id pub-id-type="pmid">35816382</article-id>
      <article-id pub-id-type="doi">10.2196/39003</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Exploring the Association of Cancer and Depression in Electronic Health Records: Combining Encoded Diagnosis and Mining Free-Text Clinical Notes</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>González</surname>
            <given-names>Alejandro</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adapa</surname>
            <given-names>Karthik</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Leis</surname>
            <given-names>Angela</given-names>
          </name>
          <degrees>PsyM, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4780-7111</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Casadevall</surname>
            <given-names>David</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3986-2084</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Albanell</surname>
            <given-names>Joan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1239-4580</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Posso</surname>
            <given-names>Margarita</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5053-257X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Macià</surname>
            <given-names>Francesc</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6090-5894</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Castells</surname>
            <given-names>Xavier</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2528-0382</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Ramírez-Anguita</surname>
            <given-names>Juan Manuel</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8509-0927</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Martínez Roldán</surname>
            <given-names>Jordi</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4565-6228</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Furlong</surname>
            <given-names>Laura I</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9383-528X</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Sanz</surname>
            <given-names>Ferran</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7534-7661</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ronzano</surname>
            <given-names>Francesco</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Medicine and Life Sciences</institution>
            <institution>Universitat Pompeu Fabra</institution>
            <addr-line>C/Aiguader 88</addr-line>
            <addr-line>Barcelona, 08003</addr-line>
            <country>Spain</country>
            <phone>34 933160539</phone>
            <email>francesco.ronzano@upf.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5037-9061</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Mayer</surname>
            <given-names>Miguel A</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0362-6298</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Research Programme on Biomedical Informatics</institution>
        <institution>Hospital del Mar Medical Research Institute</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Medicine and Life Sciences</institution>
        <institution>Universitat Pompeu Fabra</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Cancer Research Program</institution>
        <institution>Hospital del Mar Research Institute</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Medical Oncology Department</institution>
        <institution>Hospital del Mar</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Epidemiology</institution>
        <institution>Hospital del Mar Research Institute</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Research Network on Chronicity, Primary Care and Health Promotion (RICAPPS)</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Innovation and Digital Transformation Area</institution>
        <institution>Hospital del Mar</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Francesco Ronzano <email>francesco.ronzano@upf.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jul-Sep</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>7</month>
        <year>2022</year>
      </pub-date>
      <volume>8</volume>
      <issue>3</issue>
      <elocation-id>e39003</elocation-id>
      <history>
        <date date-type="received">
          <day>26</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>3</day>
          <month>6</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>17</day>
          <month>6</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>20</day>
          <month>6</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Angela Leis, David Casadevall, Joan Albanell, Margarita Posso, Francesc Macià, Xavier Castells, Juan Manuel Ramírez-Anguita, Jordi Martínez Roldán, Laura I Furlong, Ferran Sanz, Francesco Ronzano, Miguel A Mayer. Originally published in JMIR Cancer (https://cancer.jmir.org), 11.07.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cancer, is properly cited. The complete bibliographic information, a link to the original publication on https://cancer.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://cancer.jmir.org/2022/3/e39003" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>A cancer diagnosis is a source of psychological and emotional stress, which are often maintained for sustained periods of time that may lead to depressive disorders. Depression is one of the most common psychological conditions in patients with cancer. According to the Global Cancer Observatory, breast and colorectal cancers are the most prevalent cancers in both sexes and across all age groups in Spain.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to compare the prevalence of depression in patients before and after the diagnosis of breast or colorectal cancer, as well as to assess the usefulness of the analysis of free-text clinical notes in 2 languages (Spanish or Catalan) for detecting depression in combination with encoded diagnoses.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We carried out an analysis of the electronic health records from a general hospital by considering the different sources of clinical information related to depression in patients with breast and colorectal cancer. This analysis included ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) diagnosis codes and unstructured information extracted by mining free-text clinical notes via natural language processing tools based on Systematized Nomenclature of Medicine Clinical Terms that mentions symptoms and drugs used for the treatment of depression.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We observed that the percentage of patients diagnosed with depressive disorders significantly increased after cancer diagnosis in the 2 types of cancer considered—breast and colorectal cancers. We managed to identify a higher number of patients with depression by mining free-text clinical notes than the group selected exclusively on ICD-9-CM codes, increasing the number of patients diagnosed with depression by 34.8% (441/1269). In addition, the number of patients with depression who received chemotherapy was higher than those who did not receive this treatment, with significant differences (<italic>P</italic>&#60;.001).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study provides new clinical evidence of the depression-cancer comorbidity and supports the use of natural language processing for extracting and analyzing free-text clinical notes from electronic health records, contributing to the identification of additional clinical data that complements those provided by coded data to improve the management of these patients.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cancer</kwd>
        <kwd>depression</kwd>
        <kwd>electronic health records</kwd>
        <kwd>text mining</kwd>
        <kwd>natural language processing</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Cancer continues to be one of the main causes of morbidity and mortality in the world, with approximately 19.3 million new cancer cases in 2020 [<xref ref-type="bibr" rid="ref1">1</xref>]. Population estimates indicate that the number of new cases will increase in the next 2 decades to 30.2 million cases per year in 2040 [<xref ref-type="bibr" rid="ref2">2</xref>]. The Global Cancer Observatory estimated that breast, prostate, and colorectal cancers were among the most frequent cancers in 2020 [<xref ref-type="bibr" rid="ref3">3</xref>]. The Global Cancer Observatory pointed out that in Spain, with a population of 46,754,783, the most prevalent cancers in both sexes and across all age groups were colorectal (14.3%, 40,441/282,421) and breast (12.1%, 34,088/282,421) cancers [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. With the advances in treatment efficacy, cancer is being increasingly viewed and treated as a chronic disease that can be effectively managed for many years [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>A cancer diagnosis is life‑changing; it is a source of important psychological and emotional stress, which is usually maintained for sustained periods of time that may lead to depressive disorders [<xref ref-type="bibr" rid="ref6">6</xref>]. Depression is one of the most common psychological conditions experienced by patients with cancer [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref9">9</xref>], a frequent comorbidity [<xref ref-type="bibr" rid="ref6">6</xref>], and one of the factors impairing the life quality of these patients [<xref ref-type="bibr" rid="ref10">10</xref>]. Depressive disorders are related to psychophysiological side effects, poorer treatment outcomes [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], longer hospital stays [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref11">11</xref>], higher mortality rates [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref8">8</xref>], and poorer quality of life [<xref ref-type="bibr" rid="ref6">6</xref>]. The prevalence of depressive disorders in patients with cancer depends on different aspects such as cancer type and stage, diagnostic criteria applied, or population studied [<xref ref-type="bibr" rid="ref7">7</xref>]. In patients with cancer, the prevalence of depression is 2 to 3 times higher than in the general population [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>], and in some studies, depression is associated with worse overall survival rates due to impaired immune response and higher rates of suicide in patients with cancer [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Depression is also one of the most common mental disorders among patients with breast and colorectal cancers [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>], affecting their daily lives and deteriorating the quality of life [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. The consequence of this mental disorder affects patients during cancer treatment and endures beyond the end of the treatment [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Moreover, depression remains an underdiagnosed disease in patients with cancer and is markedly different from depression in healthy individuals [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. The different symptoms of cancer and its treatment, such as fatigue, anorexia or loss of weight, and sleep and cognitive disorders, overlap with those of depression, which leads to an underdiagnosis of this mental disorder in these patients [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>For these reasons, it is critical to detect, diagnose, and treat depression symptoms in patients with cancer and depression. Based on the information available in electronic health records (EHRs), it is possible to have a complete clinical history of these patients, but it is necessary to fully exploit its content to make the most of these information systems [<xref ref-type="bibr" rid="ref24">24</xref>]. EHRs are increasingly implemented in many health care systems around the world, but the clinical information included in these information systems is underused in general and for research purposes and not exploited to its full potential [<xref ref-type="bibr" rid="ref25">25</xref>]. The reuse of data from EHRs for biomedical research deals with 2 main types of information. Structured data, such as patient demographics, encoded diagnosis, procedures, or drug information, are the easiest data sources to process using standard statistical methods [<xref ref-type="bibr" rid="ref26">26</xref>]. Unstructured data, including free-text clinical notes, often requires more complex analysis approaches, relying on text mining and natural language processing (NLP) tools to make it possible to extract relevant, structured information [<xref ref-type="bibr" rid="ref25">25</xref>]. NLP is used to process large amounts of unstructured text from clinical notes and return structured information about their meaning [<xref ref-type="bibr" rid="ref27">27</xref>]. The textual content of clinical notes constitutes a valuable source of information that is useful to obtaining a complete knowledge of patients’ phenotypes by complementing the information encoded in structured clinical data [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. The capacity to integrate these 2 types of clinical knowledge sources by using biomedical informatics tools is especially critical for the management of complex diseases such as cancer and depression [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>In this study, we identified and analyzed the presence of depressive disorders in patients with the most common cancers in Spain—breast or colorectal cancer—using 2 different sources of clinical information: diagnosis codes in ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) and free-text clinical notes, including mentions of depression diagnoses, their symptoms, and antidepressants.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The aim of the study was twofold: (1) to compare the association between depression in patients with breast or colorectal cancer before and after these diagnoses and (2) to determine the usefulness of the free-text clinical notes analysis using NLP for detecting the diagnosis of depression among patients with cancer in combination with encoded structured clinical information.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Clinical Database</title>
        <p>The clinical database used for the study was the EHR of the Parc de Salut Mar Barcelona, a complete health care services organization with its information system database (IMASIS). IMASIS includes the clinical information of 2 general hospitals, 1 mental health care center, and 1 social health care center in the Barcelona city area (Catalonia, Spain) since 1990, including different settings such as admissions, outpatient consultations, and emergency department visits [<xref ref-type="bibr" rid="ref31">31</xref>]. IMASIS-2 is the anonymized relational database of IMASIS, being the data source used for research purposes. To identify the diagnosis of depressive disorders, we analyzed both structured and free-text clinical notes obtained from the IMASIS-2 database [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
        <p>The diagnoses included in IMASIS-2 are encoded using the ICD-9-CM codification [<xref ref-type="bibr" rid="ref33">33</xref>]. In addition, during the interaction with their patients, physicians generate clinical notes to record the details of the anamnesis such as the diagnosis performed, prescription of drugs, as well as any kind of related information of clinical interest. At the time of the study, IMASIS-2 included the anonymized clinical information of 876,747 patients, with more than 16.7 million visits from the beginning of 1992 to the end of 2018.</p>
        <p>The Hospital del Mar Cancer Registry, which included 37,741 diagnosed malignant tumors, was also used as an additional source of information, providing data on the number of cases, characteristics, diagnostic and therapeutic process, and survival of patients with cancer at Parc de Salut Mar Barcelona [<xref ref-type="bibr" rid="ref34">34</xref>]. Each clinical record includes the timeline of the patient visits. In addition, each visit is characterized by ICD-9-CM diagnosis codes and 1 or more free-text notes written in Spanish or Catalan (both official languages used in Catalonia) generated by physicians during their interactions with patients that include the anamnesis, diagnosis, and prescriptions.</p>
      </sec>
      <sec>
        <title>Patients’ Selection Criteria</title>
        <p>The initial group of patients considered in our study consisted of the 10,668 individuals who were diagnosed with breast cancer (in women; ICD-9-CM–related code 174) and colorectal cancer (ICD-9-CM–related codes 153 and 154). The patients with cancer were classified in the Cancer Registry by stage (one of in situ, I, II, III, or IV stages) and the type of treatment received including chemotherapy. We obtained a sample of 10,668 patients with breast cancer or colorectal cancer. Of the total 10,668 patients, 2485 were excluded due to having more than 1 cancer or incomplete clinical information, with 8147 patients remaining. Of these 8147 patients, we selected 4238 individuals for the study who had (1) at least 4 or more visits recorded in the IMASIS-2, including 2 before and 2 after the cancer diagnosis; (2) breast or colorectal cancer that were in the “in situ” stage or stages I, II, or III; and (3) complete information about the treatments received for cancer. Patients in stage IV were not included because these patients were in an advanced stage of cancer, and they usually received palliative care or experienced depression [<xref ref-type="bibr" rid="ref9">9</xref>]. Each visit is characterized by the diagnosis codes and 1 or more free-text notes written in Spanish or Catalan generated by physicians during their interaction with the patients. Physicians and health care practitioners usually rely on clinical notes to record the details of the anamnesis and diagnosis they performed, prescriptions and doses of drugs, as well as any kind of related information of interest. Considering that patients with cancer usually have several visits and clinical complexity, we decided to include at least 4 visits to ensure that enough clinical information of the follow-up was analyzed. The flow diagram of the study is depicted in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow diagram of the study process.</p>
          </caption>
          <graphic xlink:href="cancer_v8i3e39003_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>To get thorough information describing the occurrence of depressive disorders among patients with breast and colorectal cancers, we used a combination of different sources of clinical information present in the EHR. The included sources are the occurrence of ICD-9-CM diagnosis codes registered and related to depressive disorders (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) and the text mining of clinical notes by means of NLP tools to detect mentions of (1) terms and expressions that are commonly used to describe depressive disorders (based on Systematized Nomenclature of Medicine Clinical Terms [SNOMED CT] related to depressive disorders) [<xref ref-type="bibr" rid="ref35">35</xref>] and (2) drugs used for the treatment of depression (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
        <p>We analyzed the textual content of the 272,575 clinical notes from the visits of the 4238 patients with the considered cancers. The text of each clinical note was processed by means of the FreeLing [<xref ref-type="bibr" rid="ref36">36</xref>] open-source language analysis framework, and the following text analysis steps were performed (see <xref rid="figure2" ref-type="fig">Figure 2</xref>).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The different text mining tools used and applied for the clinical annotations analysis.</p>
          </caption>
          <graphic xlink:href="cancer_v8i3e39003_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <list list-type="bullet">
          <list-item>
            <p>Language identification: The FreeLing language analyzer determined, for each clinical note, the language used (Spanish or Catalan). All subsequent NLP analyses performed were language-specific.</p>
          </list-item>
          <list-item>
            <p>Tokenization and part-of-speech tagging: The text of each clinical note was divided into tokens (substrings with assigned and identified meaning), and the part of speech of each token was identified (determiner, preposition, conjunction, punctuation, verb, adjective, pronoun, adverb, and name).</p>
          </list-item>
          <list-item>
            <p>Terms detection: In the text of each clinical note, mentions of the following types of terms were identified: (1) names of the active substances of the 35 antidepressants and their corresponding 82 brand names used in Spain; and (2) SNOMED CT with depressive disorders–related terms, including the lexicalizations of the 139 concepts classified under the concept “trastorno depresivo (trastorno)” (depressive disorder [disorder] in Spanish; SNOMED CT ID 35489007). We searched for mentions of antidepressant active substances and their commercial drug names over the whole textual content of clinical notes. For this purpose, we exploited the Elasticsearch search and analytics tool [<xref ref-type="bibr" rid="ref37">37</xref>]. This search engine, apart from substantially speeding up the search for relevant mentions in the huge collections of clinical notes, allowed us to properly match the variations of the considered terms with respect to misspellings that are frequent in free-text clinical notes.</p>
          </list-item>
          <list-item>
            <p>Negation characterization: A negation detection algorithm tailored to the Spanish and Catalan languages was applied to the clinical notes for both SNOMED CT depressive disorders terms and antidepressant active substance and brand names to exclude the negated occurrences of these terms from our study. This detection was performed using a negation detection algorithm implemented as a token sequence tagger, relying on Conditional Random Fields. For this purpose, a corpus of 949 sentences (572 in Spanish and 277 in Catalan) extracted from clinical notes were manually annotated, detecting for each sentence the negation marker and the related negation span (ie, the portion of the text of the sentence that is actually negated). This corpus has been used to train a Conditional Random Fields sequence tagger that is able to automatically identify negation markers and related spans inside the text of clinical notes in Spanish and Catalan.</p>
          </list-item>
        </list>
        <p>When needed, the names of antidepressant active substances as well as the names of depressive disorders–related terms from SNOMED CT were manually translated into Spanish and Catalan by a bilingual psychologist, since the textual content of the clinical notes analyzed in our study includes both languages.</p>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>The study was approved by the Hospital del Mar Research Ethics Committee (Comitè Ètic d'Investigació Clínica del Parc de Salut Mar; 2016/7130/l) and performed according to the Declaration of Helsinki, the General Data Protection Regulation (EU 2016/679), and the Spanish Law (3/2018) for data protection. All data were anonymized and treated with maximal confidentiality and respect according to good clinical practice guidelines.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>The number of patients with cancer included in our study was 4238. There were 2032 women with breast cancer with a mean age of 62.3 (SD 13.2) years, and there were 2206 patients with colorectal cancer with a mean age of 70.5 (SD 11.4) years, including 1277 (57.9%) men and 929 (42.1%) women with significant differences in the ages of both groups of patients with these cancers (<italic>P</italic>&#60;.001). The distribution of age by stages of both cancers is shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. The median age increases gradually according to the stage of the cancer, and it is higher in patients with colorectal cancer. The median age changed from 60 years in the “in situ” stage to 68 years in stage III for breast cancer and from 68 years in the “in situ” stage to 73 years in stage III for colorectal cancer.</p>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Distribution of age by the stages of breast and colorectal cancers. The median age is shown as a vertical line.</p>
        </caption>
        <graphic xlink:href="cancer_v8i3e39003_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>The total number of patients with depression based on the use of ICD-9-CM, antidepressants drug mentions, SNOMED CT concepts related to depressive disorders, or the combination of these 3 methods was 1269. The percentage of patients diagnosed with depressive disorders increased after cancer diagnosis, with significant differences across all the types of cancer considered (<italic>P</italic>=.004) and the stages of cancer (<italic>P</italic>&#60;.001). In <xref ref-type="table" rid="table1">Table 1</xref>, the distribution of patients according to the type of cancer, stage, and depression after the date of diagnosis of cancer based on ICD-9-CM codes is shown.</p>
      <p>The increase in the number of patients with depression observed was a trend that we found separately in the ICD-9-CM codes, mentions of antidepressant drugs, and mentions of the set of SNOMED CT depression concepts. In the tables below, we show the number of patients with depression before and after the diagnosis of cancer using 3 different methods to detect them: the ICD-9-CM depression codes, antidepressant drug mentions, and SNOMED CT concepts related to “trastorno depresivo,” and the combination of the 3 methods.</p>
      <p>Considering exclusively the ICD-9-CM codes of depressive disorders and excluding patients diagnosed with depression in visits both before and after the date of cancer diagnosis (n=164), of the 4074 remaining patients, 16.3% (n=664) were diagnosed with depression, and 86.6% (575/664) were diagnosed after the cancer diagnosis date (see <xref ref-type="table" rid="table2">Table 2</xref>). The total number of patients with depression increased significantly after the date of cancer diagnosis (McNemar test: <italic>χ</italic><sup>2</sup><sub>1</sub>=354.25; <italic>P</italic>&#60;.001).</p>
      <p>Considering the diagnosis of depression based on antidepressant drug mentions and excluding patients diagnosed with depression in visits both before and after the date of diagnosis cancer (n=68), of the 4170 remaining patients, 15% (n=624) were diagnosed with depression, and 91% (568/624) were diagnosed after the cancer diagnosis date (see <xref ref-type="table" rid="table3">Table 3</xref>). The total number of patients with depression increased significantly after the diagnosis date of cancer (McNemar test: <italic>χ</italic><sup>2</sup><sub>1</sub>=418.46: <italic>P</italic>&#60;.001).</p>
      <p>Of the 824 antidepressant mentions, the most frequent were citalopram (n=274, 33.3%), escitalopram (n=174, 21.1%), amitriptyline (n=125, 15.2%), trazodone (n=64, 7.8%), venlafaxine (n=57, 6.9%), paroxetine (n=37, 4.5%), desvenlafaxine (n=22, 2.7%), fluoxetine (n=22, 2.7%), and bupropion (n=21, 2.5%).</p>
      <p>Considering the mentions of SNOMED CT depression concepts and excluding patients diagnosed with depression in visits both before and after the date of cancer diagnosis (n=20), of the 4218 remaining patients, 379 (89%, N=426) patients with depression were diagnosed after the data of cancer diagnosis—222 (94.5%) out of 235 for breast cancer and 157 (82.2%) out of 191 for colorectal cancer (see <xref ref-type="table" rid="table4">Table 4</xref>). The total number of patients with depression increased significantly after the diagnosis date of cancer (McNemar test: <italic>χ</italic><sup>2</sup><sub>1</sub>=257.19; <italic>P</italic>&#60;.001).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Distribution of patients according to the type of cancer, stage, and diagnosis of depression based on ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) codification.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="270"/>
          <col width="320"/>
          <col width="380"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Cancer type, cancer stage</td>
              <td>Number of patients, n/N (%)</td>
              <td>Depression (ICD-9-CM) after cancer diagnosis, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="4">
                <bold>Breast</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>In situ</td>
              <td>234/2032 (11.5)</td>
              <td>40/234 (17.1)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage I</td>
              <td>739/2032 (36.4)</td>
              <td>152/739 (20.6)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage II</td>
              <td>781/2032 (38.4)</td>
              <td>166/781 (21.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage III</td>
              <td>278/2032 (13.7)</td>
              <td>82/278 (29.5)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>All stages</td>
              <td>2032/2032 (100)</td>
              <td>440/2032 (21.7)</td>
            </tr>
            <tr valign="top">
              <td colspan="4">
                <bold>Colorectal</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>In situ</td>
              <td>544/2206 (24.7)</td>
              <td>48/544 (8.8)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage I</td>
              <td>438/2206 (19.9)</td>
              <td>61/438 (13.9)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage II</td>
              <td>656/2206 (29.7)</td>
              <td>94/656 (14.3)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Stage III</td>
              <td>568/2206 (25.7)</td>
              <td>96/568 (16.9)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>All stages</td>
              <td>2206/2206 (100)</td>
              <td>299/2206 (13.6)</td>
            </tr>
            <tr valign="top">
              <td colspan="2">Total</td>
              <td>4238/4238 (100)</td>
              <td>739/4238 (17.4)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Number of patients characterized by ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) depression diagnosis codes before and after the cancer diagnosis date.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="220"/>
          <col width="210"/>
          <col width="200"/>
          <col width="210"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>Before cancer diagnosis date, n/N (%)</td>
              <td>After cancer diagnosis date, n/N (%)</td>
              <td>Patients with depression, n/N (%)</td>
              <td>Patients without depression, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast</td>
              <td>39/398 (9.8)</td>
              <td>359/398 (90.2)</td>
              <td>398/1951 (20.4)</td>
              <td>1553/1951 (79.6)</td>
            </tr>
            <tr valign="top">
              <td>Colorectal</td>
              <td>50/266 (18.8)</td>
              <td>216/266 (81.2)</td>
              <td>266/2123 (12.5)</td>
              <td>1857/2123 (84.5)</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>89/664 (13.4)</td>
              <td>575/664 (86.6)</td>
              <td>664/4074 (16.3)</td>
              <td>3410/4074 (83.7)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Number of patients with antidepressant drug mentions before and after the cancer diagnosis date.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="220"/>
          <col width="210"/>
          <col width="200"/>
          <col width="210"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>Before cancer diagnosis date, n/N (%)</td>
              <td>After cancer diagnosis date, n/N (%)</td>
              <td>Patients with depression, n/N (%)</td>
              <td>Patients without depression, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast</td>
              <td>27/352 (7.7)</td>
              <td>325/352 (92.3)</td>
              <td>352/2009 (17.5)</td>
              <td>1657/2009 (82.5)</td>
            </tr>
            <tr valign="top">
              <td>Colorectal</td>
              <td>29/272 (10.7)</td>
              <td>243/272 (89.3)</td>
              <td>272/2161 (12.6)</td>
              <td>1889/2161 (87.4)</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>56/624 (9)</td>
              <td>568/624 (91)</td>
              <td>624/4170 (15)</td>
              <td>3546/4170 (85)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table4">
        <label>Table 4</label>
        <caption>
          <p>Number of patients with mentions of SNOMED CT (Systematized Nomenclature of Medicine Clinical Terms) concepts related to “trastorno depresivo” (depressive disorder in Spanish) before and after the cancer diagnosis date.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="220"/>
          <col width="210"/>
          <col width="200"/>
          <col width="210"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>Before cancer diagnosis date, n/N (%)</td>
              <td>After cancer diagnosis date, n/N (%)</td>
              <td>Patients with depression, n/N (%)</td>
              <td>Patients without depression, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast</td>
              <td>13/235 (5.5)</td>
              <td>222/235 (94.5)</td>
              <td>235/2021 (11.6)</td>
              <td>1786/2021 (88.4)</td>
            </tr>
            <tr valign="top">
              <td>Colorectal</td>
              <td>34/191 (17.8)</td>
              <td>157/191 (82.2)</td>
              <td>191/2197 (8.7)</td>
              <td>2006/2197 (91.3)</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>47/426 (11)</td>
              <td>379/426 (89)</td>
              <td>426/4218 (10)</td>
              <td>3792/4218 (90)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>When we considered the previous 3 selection criteria together (ICD-9 codes, drug mentions, and SNOMED CT concepts) to detect patients with a diagnosis of depression and excluded the patients with a depression diagnosis both before and after cancer diagnosis date (n=248), of a total of 1021 patients, 920 (90.1%) were diagnosed after the cancer diagnosis date—533 (92.5%) out of 576 for breast cancer and 387 (87%) out of 445 for colorectal cancer (see <xref ref-type="table" rid="table5">Table 5</xref>).</p>
      <p>Of the total 4238 individuals, we identified 1269 (30%) characterized by 1 or more diagnoses of depression by analyzing their clinical histories (both ICD-9-CM codes and clinical notes, including drug mentions and SNOMED CT concepts detection). The identification of a diagnosis of depression in 441 (34.8%) patients out of 1269 has been performed by relying exclusively on the analysis of clinical notes using text mining (drugs and SNOMED CT concepts detection)—such patients would have not been considered as having been diagnosed with depression by relying on ICD-9-CM clinical codes. If we consider patients with breast cancer, the diagnosis of depression has been performed by relying exclusively on text mining in 30.6% (211/690) of the patients; this percentage is 39.7% (230/579) when we consider patients with colorectal cancer. Consequently, thanks to the analysis of clinical notes, we detected a considerably larger number (828/1269, 65.2%) of patients diagnosed with depression, with 34.8% (441/1269) more individuals using text mining (drugs or SNOMED CT concept mentions), by relying on ICD-9-CM codes in combination or not with drugs or SNOMED CT concepts mentions (see <xref ref-type="table" rid="table6">Table 6</xref>).</p>
      <p>Finally, we tried to determine if there was a relationship between the onset of depression and receiving chemotherapy. Of the 2032 patients with breast cancer, 907 (44.6%) received chemotherapy and 1125 (55.4%) did not. Of the 2206 patients with colorectal cancer, 564 (25.6%) received chemotherapy and 1642 (74.4%) did not. The number of patients with depression who received chemotherapy was higher than those who did not receive chemotherapy, with significant differences (<italic>P</italic>&#60;.001).</p>
      <table-wrap position="float" id="table5">
        <label>Table 5</label>
        <caption>
          <p>Number of patients with ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) codes of depressive disorders, a mention of antidepressant drugs, or a mention of one of the sets of 139 SNOMED CT (Systematized Nomenclature of Medicine Clinical Terms) concepts subsumed by the concept “trastorno depresivo” (depressive disorder in Spanish), before and after the cancer diagnosis date.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="230"/>
          <col width="230"/>
          <col width="180"/>
          <col width="200"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>ICD-9-CM codes or mentions of drugs and SNOMED CT concepts before cancer diagnosis date, n/N (%)</td>
              <td>ICD-9-CM codes or mentions of drugs and SNOMED CT concepts after cancer diagnosis date, n/N (%)</td>
              <td>ICD-9-CM codes or mentions of drugs and SNOMED CT concepts, n/N (%)</td>
              <td>No ICD-9-CM codes or mentions of drugs and SNOMED CT, concepts, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast</td>
              <td>43/576 (7.5)</td>
              <td>533/576 (92.5)</td>
              <td>576/1918 (30)</td>
              <td>1342/1918 (70)</td>
            </tr>
            <tr valign="top">
              <td>Colorectal</td>
              <td>58/445 (13)</td>
              <td>387/445 (87)</td>
              <td>445/2072 (21.5)</td>
              <td>1627/2072 (78.5)</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>101/1021 (9.9)</td>
              <td>920/1021 (90.1)</td>
              <td>1021/3990 (25.6)</td>
              <td>2969/3990 (74.4)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table6">
        <label>Table 6</label>
        <caption>
          <p>Number of patients with ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) codes with or without mentions of drugs or SNOMED CT (Systematized Nomenclature of Medicine Clinical Terms) concepts.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="420"/>
          <col width="420"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>ICD-9-CM codes without mentions of drugs or SNOMED CT concepts, n/N (%)</td>
              <td>ICD-9-CM codes with mentions of drugs or SNOMED CT concepts, n/N (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast</td>
              <td>479/690 (69.4)</td>
              <td>211/690 (30.6)</td>
            </tr>
            <tr valign="top">
              <td>Colorectal</td>
              <td>349/579 (60.3)</td>
              <td>230/579 (39.7)</td>
            </tr>
            <tr valign="top">
              <td>Total</td>
              <td>828/1269 (65.2)</td>
              <td>441/1269 (34.8)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The detection of depressive disorders in patients with cancer is a key element in the management of these patients, which can impact the treatment outcomes of cancer [<xref ref-type="bibr" rid="ref6">6</xref>]. In this study, we analyzed the relationship between depression and cancer diagnosis, particularly in breast and colorectal cancers. We considered the diagnosis of depression based on both structured information encoded by ICD-9-CM codes and extracted information from free-text clinical notes, using text mining and NLP tools for the mentions of antidepressant drugs and SNOMED CT concepts related to the concept “trastorno depresivo” (depressive disorder in Spanish). We identified a significantly higher number of patients with depression after the diagnosis of cancer, in both breast and colorectal cancers, thus highlighting the importance of such comorbidity in patients with these conditions [<xref ref-type="bibr" rid="ref9">9</xref>]. The proportion of patients with depression increased with the progression of the cancer stage and when receiving chemotherapy. In addition, this trend was maintained when we detected patients with depression using the different sources of information that are available in the EHR, including structured data and free-text clinical notes in which antidepressants and depressive symptoms are mentioned. Nevertheless, our study demonstrates that the diagnosis of depression detected by medical doctors is not always registered using codifications (ie, ICD-9-CM codes), but it is often mentioned exclusively in free text in clinical notes where it can be indirectly detected based on the mentions of depressive symptoms or antidepressant drugs [<xref ref-type="bibr" rid="ref38">38</xref>]. The detection of information related to depression from unstructured EHR data identified individuals among the patients included in the study who were missed based only on the information from encoded data.</p>
        <p>The use of unstructured data for the identification of conditions such as depression, as well as other diseases and comorbidities [<xref ref-type="bibr" rid="ref26">26</xref>], should be considered as a source of information that can contribute to the management of complex diseases such as cancer and depression. Using NLP methods to detect patients with conditions that are previously encoded can improve the codification process and follow-up of these patients. In addition, the use of NLP to detect symptoms and comorbidities from free text in the EHR can contribute to the characterization of diseases or predict response to treatment [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <p>The value of relying on these 2 types of clinical information—structured and unstructured—has been analyzed in other conditions such as geriatric syndrome [<xref ref-type="bibr" rid="ref26">26</xref>], different mental illnesses [<xref ref-type="bibr" rid="ref42">42</xref>], and psychiatric phenotyping [<xref ref-type="bibr" rid="ref43">43</xref>], helping in the identification of additional clinical information not registered using codifications, although the extraction of this data is challenging and resource intensive.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has some limitations. It is not uncommon that if the main cause of admission of a patient is a complication of cancer, other secondary diagnoses such as depression are not included in the medical discharge report, and for this reason, these diagnoses can be underrecorded. However, specific words and expressions used by medical doctors to mention depression-related symptoms in clinical notes may not have been included among the terms used in this study. We based our analyses of clinical notes exclusively on the terminology encoded in SNOMED CT to capture mentions of depressive disorders, and therefore, our terminology could underestimate the number of patients with depression. In this regard, free text can be further explored to identify other expressions and terms used by clinicians to describe depression symptoms [<xref ref-type="bibr" rid="ref26">26</xref>]. Finally, the mentions of antidepressant drugs could not always be associated with a diagnosis of depression but rather with other mental disorders in which these drugs are prescribed.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrated that the use of NLP for extracting and processing unstructured clinical information, which is present in free-text clinical notes in the EHR, in combination with encoded diagnosis can contribute to the identification of relevant clinical data—in this case, the detection of depressive disorders in patients with breast and colorectal cancers. This study shows the possibility of combining structured and unstructured data included in the EHR, providing new opportunities to better understand and manage complex diseases and their comorbidities, such as cancer and depression, to the benefit of these patients. In future works, we intend to extract information from the EHR using NLP in combination with machine learning methods and apply prediction models to estimate different possible outcomes.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>ICD-9-CM (International Classification of Diseases, Ninth Revision, Clinical Modification) diagnosis codes related to depressive disorders used in the study.</p>
        <media xlink:href="cancer_v8i3e39003_app1.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Names of the active substances of the 35 antidepressants and their corresponding 82 brand names used in Spain.</p>
        <media xlink:href="cancer_v8i3e39003_app2.docx" xlink:title="DOCX File , 17 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ICD-9-CM</term>
          <def>
            <p>International Classification of Diseases, Ninth Revision, Clinical Modification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">SNOMED CT</term>
          <def>
            <p>Systematized Nomenclature of Medicine Clinical Terms</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The Research Programme on Biomedical Informatics (GRIB) is a member of the Spanish National Bioinformatics Institute and funded by Instituto de Salud Carlos III and FEDER (PT17/0009/0014). The GRIB is also supported by the Agència de Gestió d’Ajuts Universitaris i de Recerca, Generalitat de Catalunya (2017 SGR 00519). This research was carried out under the framework of the project Creating medically-driven integrative bioinformatics applications focused on oncology, CNS disorders and their comorbidities (MedBioinformatics, H2020-EU; grant 634143); and partially funded by the Institute of Health Carlos III (project IMPaCT-Data; IMP/00019) and cofunded by the European Union, European Regional Development Fund (“A way to make Europe”); and the Clinical Knowledge Aggregation by Mining Medical Reports (CliKA-MinE; PI17/00230), which is funded by Institute of Health Carlos III and cofunded by the European Union.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The study involves the use of patients’ medical data from the Hospital del Mar according to the General Data Protection Regulation. The data is not publicly available due to the ethical regulations under which the data is collected from our hospital database.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>The first draft was written jointly by AL, MAM, and FR. All the authors have read and agreed to the final version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Laversanne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Soerjomataram</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>
          <source>CA Cancer J Clin</source>
          <year>2021</year>
          <month>05</month>
          <volume>71</volume>
          <issue>3</issue>
          <fpage>209</fpage>
          <lpage>249</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3322/caac.21660"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>
          <pub-id pub-id-type="medline">33538338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Las cifras del cáncer en España 2021</article-title>
          <source>Sociedad Española de Oncología Médica (SEOM)</source>
          <year>2021</year>
          <access-date>2022-06-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://seom.org/images/Cifras_del_cancer_en_Espnaha_2021.pdf">https://seom.org/images/Cifras_del_cancer_en_Espnaha_2021.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>World summary statistics (2020)</article-title>
          <source>The Global Cancer Observatory</source>
          <year>2021</year>
          <month>03</month>
          <access-date>2022-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gco.iarc.fr/today/data/factsheets/populations/900-world-fact-sheets.pdf">https://gco.iarc.fr/today/data/factsheets/populations/900-world-fact-sheets.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>Spain summary statistics (2020)</article-title>
          <source>The Global Cancer Observatory</source>
          <year>2021</year>
          <month>03</month>
          <access-date>2022-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gco.iarc.fr/today/data/factsheets/populations/724-spain-fact-sheets.pdf">https://gco.iarc.fr/today/data/factsheets/populations/724-spain-fact-sheets.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watts</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Leydon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Birch</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Prescott</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Eardley</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lewith</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Depression and anxiety in prostate cancer: a systematic review and meta-analysis of prevalence rates</article-title>
          <source>BMJ Open</source>
          <year>2014</year>
          <month>03</month>
          <day>13</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>e003901</fpage>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2013-003901</pub-id>
          <pub-id pub-id-type="medline">24625637</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2013-003901</pub-id>
          <pub-id pub-id-type="pmcid">PMC3963074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>HR</given-names>
            </name>
          </person-group>
          <article-title>Depression in cancer patients: pathogenesis, implications and treatment (review)</article-title>
          <source>Oncol Lett</source>
          <year>2015</year>
          <month>04</month>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>1509</fpage>
          <lpage>1514</lpage>
          <pub-id pub-id-type="doi">10.3892/ol.2015.2944</pub-id>
          <pub-id pub-id-type="medline">25788991</pub-id>
          <pub-id pub-id-type="pii">ol-09-04-1509</pub-id>
          <pub-id pub-id-type="pmcid">PMC4356432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzgerald</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rodin</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Evidence-based treatment of depression in patients with cancer</article-title>
          <source>J Clin Oncol</source>
          <year>2012</year>
          <month>04</month>
          <day>10</day>
          <volume>30</volume>
          <issue>11</issue>
          <fpage>1187</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1200/JCO.2011.39.7372</pub-id>
          <pub-id pub-id-type="medline">22412144</pub-id>
          <pub-id pub-id-type="pii">JCO.2011.39.7372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hinz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Herzberg</surname>
              <given-names>PY</given-names>
            </name>
            <name name-style="western">
              <surname>Lordick</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Weis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Faller</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brähler</surname>
              <given-names>Elmar</given-names>
            </name>
            <name name-style="western">
              <surname>Härter</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Wegscheider</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Geue</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mehnert</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Age and gender differences in anxiety and depression in cancer patients compared with the general population</article-title>
          <source>Eur J Cancer Care (Engl)</source>
          <year>2019</year>
          <month>09</month>
          <day>09</day>
          <volume>28</volume>
          <issue>5</issue>
          <fpage>e13129</fpage>
          <pub-id pub-id-type="doi">10.1111/ecc.13129</pub-id>
          <pub-id pub-id-type="medline">31290218</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hinz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Hauss</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Höckel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kortmann</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stolzenburg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarz</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Anxiety and depression in cancer patients compared with the general population</article-title>
          <source>Eur J Cancer Care (Engl)</source>
          <year>2010</year>
          <month>07</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>522</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1365-2354.2009.01088.x</pub-id>
          <pub-id pub-id-type="medline">20030697</pub-id>
          <pub-id pub-id-type="pii">ECC1088</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayr</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Pancreatic cancer and depression: myth and truth</article-title>
          <source>BMC Cancer</source>
          <year>2010</year>
          <month>10</month>
          <day>20</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>569</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmccancer.biomedcentral.com/articles/10.1186/1471-2407-10-569"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2407-10-569</pub-id>
          <pub-id pub-id-type="medline">20961421</pub-id>
          <pub-id pub-id-type="pii">1471-2407-10-569</pub-id>
          <pub-id pub-id-type="pmcid">PMC2976753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Satin</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Linden</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Depression as a predictor of disease progression and mortality in cancer patients: a meta-analysis</article-title>
          <source>Cancer</source>
          <year>2009</year>
          <month>11</month>
          <day>15</day>
          <volume>115</volume>
          <issue>22</issue>
          <fpage>5349</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/cncr.24561"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cncr.24561</pub-id>
          <pub-id pub-id-type="medline">19753617</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Linden</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Vodermaier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mackenzie</surname>
              <given-names>Regina</given-names>
            </name>
            <name name-style="western">
              <surname>Greig</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Anxiety and depression after cancer diagnosis: prevalence rates by cancer type, gender, and age</article-title>
          <source>J Affect Disord</source>
          <year>2012</year>
          <month>12</month>
          <day>10</day>
          <volume>141</volume>
          <issue>2-3</issue>
          <fpage>343</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jad.2012.03.025</pub-id>
          <pub-id pub-id-type="medline">22727334</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(12)00221-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehnert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brähler</surname>
              <given-names>Elmar</given-names>
            </name>
            <name name-style="western">
              <surname>Faller</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Härter</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Keller</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wegscheider</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Weis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boehncke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hund</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Reuter</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Richard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sehner</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sommerfeldt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Szalai</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wittchen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Four-week prevalence of mental disorders in patients with cancer across major tumor entities</article-title>
          <source>J Clin Oncol</source>
          <year>2014</year>
          <month>11</month>
          <day>01</day>
          <volume>32</volume>
          <issue>31</issue>
          <fpage>3540</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1200/JCO.2014.56.0086</pub-id>
          <pub-id pub-id-type="medline">25287821</pub-id>
          <pub-id pub-id-type="pii">JCO.2014.56.0086</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dauchy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dolbeault</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Depression in cancer patients</article-title>
          <source>EJC Suppl</source>
          <year>2013</year>
          <month>09</month>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>205</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1359-6349(13)00007-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejcsup.2013.07.006</pub-id>
          <pub-id pub-id-type="medline">26217129</pub-id>
          <pub-id pub-id-type="pii">S1359-6349(13)00007-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC4041309</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Misono</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Fann</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Redman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yueh</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Incidence of suicide in persons with cancer</article-title>
          <source>J Clin Oncol</source>
          <year>2008</year>
          <month>10</month>
          <day>10</day>
          <volume>26</volume>
          <issue>29</issue>
          <fpage>4731</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18695257"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/JCO.2007.13.8941</pub-id>
          <pub-id pub-id-type="medline">18695257</pub-id>
          <pub-id pub-id-type="pii">JCO.2007.13.8941</pub-id>
          <pub-id pub-id-type="pmcid">PMC2653137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinquart</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duberstein</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Depression and cancer mortality: a meta-analysis</article-title>
          <source>Psychol Med</source>
          <year>2010</year>
          <month>11</month>
          <volume>40</volume>
          <issue>11</issue>
          <fpage>1797</fpage>
          <lpage>810</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20085667"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S0033291709992285</pub-id>
          <pub-id pub-id-type="medline">20085667</pub-id>
          <pub-id pub-id-type="pii">S0033291709992285</pub-id>
          <pub-id pub-id-type="pmcid">PMC2935927</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsaras</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Papathanasiou</surname>
              <given-names>IV</given-names>
            </name>
            <name name-style="western">
              <surname>Mitsi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Veneti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kelesi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zyga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fradelos</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Assessment of depression and anxiety in breast cancer patients: prevalence and associated factors</article-title>
          <source>Asian Pac J Cancer Prev</source>
          <year>2018</year>
          <month>06</month>
          <day>25</day>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>1661</fpage>
          <lpage>1669</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://journal.waocp.org/?sid=Entrez:PubMed&#38;id=pmid:29938451&#38;key=2018.19.6.1661"/>
          </comment>
          <pub-id pub-id-type="doi">10.22034/APJCP.2018.19.6.1661</pub-id>
          <pub-id pub-id-type="medline">29938451</pub-id>
          <pub-id pub-id-type="pmcid">PMC6103579</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pilevarzadeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Amirshahi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Afsargharehbagh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rafiemanesh</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hashemi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Balouchi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Global prevalence of depression among breast cancer patients: a systematic review and meta-analysis</article-title>
          <source>Breast Cancer Res Treat</source>
          <year>2019</year>
          <month>08</month>
          <day>13</day>
          <volume>176</volume>
          <issue>3</issue>
          <fpage>519</fpage>
          <lpage>533</lpage>
          <pub-id pub-id-type="doi">10.1007/s10549-019-05271-3</pub-id>
          <pub-id pub-id-type="medline">31087199</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10549-019-05271-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lloyd</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baraghoshi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Garrido-Laguna</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gilcrease</surname>
              <given-names>IG</given-names>
            </name>
            <name name-style="western">
              <surname>Whisenant</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Scaife</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pickron</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Monroe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelaziz</surname>
              <given-names>Sarah</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>Alison M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>Ken R</given-names>
            </name>
            <name name-style="western">
              <surname>Deshmukh</surname>
              <given-names>Vikrant</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Rowe</surname>
              <given-names>Kerry G</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>John</given-names>
            </name>
            <name name-style="western">
              <surname>Samadder</surname>
              <given-names>Niloy J</given-names>
            </name>
            <name name-style="western">
              <surname>Hashibe</surname>
              <given-names>Mia</given-names>
            </name>
          </person-group>
          <article-title>Mental health disorders are more common in colorectal cancer survivors and associated with decreased overall survival</article-title>
          <source>Am J Clin Oncol</source>
          <year>2019</year>
          <month>04</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>355</fpage>
          <lpage>362</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30844850"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/COC.0000000000000529</pub-id>
          <pub-id pub-id-type="medline">30844850</pub-id>
          <pub-id pub-id-type="pmcid">PMC6433523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of depression and anxiety in colorectal cancer patients: a literature review</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2019</year>
          <month>01</month>
          <day>31</day>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>411</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph16030411"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph16030411</pub-id>
          <pub-id pub-id-type="medline">30709020</pub-id>
          <pub-id pub-id-type="pii">ijerph16030411</pub-id>
          <pub-id pub-id-type="pmcid">PMC6388369</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aminisani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nikbakht</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Asghari Jafarabadi</surname>
              <given-names>Mohammad</given-names>
            </name>
            <name name-style="western">
              <surname>Shamshirgaran</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Depression, anxiety, and health related quality of life among colorectal cancer survivors</article-title>
          <source>J Gastrointest Oncol</source>
          <year>2017</year>
          <month>02</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>81</fpage>
          <lpage>88</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.21037/jgo.2017.01.12"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/jgo.2017.01.12</pub-id>
          <pub-id pub-id-type="medline">28280612</pub-id>
          <pub-id pub-id-type="pii">jgo-08-01-081</pub-id>
          <pub-id pub-id-type="pmcid">PMC5334052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cvetković</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadović</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Depression in breast cancer patients</article-title>
          <source>Psychiatry Res</source>
          <year>2016</year>
          <month>06</month>
          <day>30</day>
          <volume>240</volume>
          <fpage>343</fpage>
          <lpage>347</lpage>
          <pub-id pub-id-type="doi">10.1016/j.psychres.2016.04.048</pub-id>
          <pub-id pub-id-type="medline">27138829</pub-id>
          <pub-id pub-id-type="pii">S0165-1781(16)30519-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lloyd-Williams</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Depression--the hidden symptom in advanced cancer</article-title>
          <source>J R Soc Med</source>
          <year>2003</year>
          <month>12</month>
          <day>01</day>
          <volume>96</volume>
          <issue>12</issue>
          <fpage>577</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14645605"/>
          </comment>
          <pub-id pub-id-type="doi">10.1258/jrsm.96.12.577</pub-id>
          <pub-id pub-id-type="medline">14645605</pub-id>
          <pub-id pub-id-type="pmcid">PMC539654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tayefi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ngo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chomutare</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dalianis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Salvi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Budrionis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Godtliebsen</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Challenges and opportunities beyond structured data in analysis of electronic health records</article-title>
          <source>WIREs Comp Stat</source>
          <year>2021</year>
          <month>02</month>
          <day>14</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>e1549</fpage>
          <pub-id pub-id-type="doi">10.1002/wics.1549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brunak</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Mining electronic health records: towards better research applications and clinical care</article-title>
          <source>Nat Rev Genet</source>
          <year>2012</year>
          <month>05</month>
          <day>02</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>395</fpage>
          <lpage>405</lpage>
          <pub-id pub-id-type="doi">10.1038/nrg3208</pub-id>
          <pub-id pub-id-type="medline">22549152</pub-id>
          <pub-id pub-id-type="pii">nrg3208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Anzaldi</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Leff</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>The value of unstructured electronic health record data in geriatric syndrome case identification</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2018</year>
          <month>08</month>
          <volume>66</volume>
          <issue>8</issue>
          <fpage>1499</fpage>
          <lpage>1507</lpage>
          <pub-id pub-id-type="doi">10.1111/jgs.15411</pub-id>
          <pub-id pub-id-type="medline">29972595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simmons</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Text mining for precision medicine: bringing structure to EHRs and biomedical literature to understand genes and health</article-title>
          <source>Adv Exp Med Biol</source>
          <year>2016</year>
          <volume>939</volume>
          <fpage>139</fpage>
          <lpage>166</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27807747"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-981-10-1503-8_7</pub-id>
          <pub-id pub-id-type="medline">27807747</pub-id>
          <pub-id pub-id-type="pmcid">PMC5931382</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>QT</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Shutes-David</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thielke</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Tsuang</surname>
              <given-names>DW</given-names>
            </name>
          </person-group>
          <article-title>Detection of probable dementia cases in undiagnosed patients using structured and unstructured electronic health records</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>07</month>
          <day>09</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>128</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0846-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0846-4</pub-id>
          <pub-id pub-id-type="medline">31288818</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0846-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6617952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheikhalishahi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Lavelli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rinaldi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Osmani</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of clinical notes on chronic diseases: systematic review</article-title>
          <source>JMIR Med Inform</source>
          <year>2019</year>
          <month>04</month>
          <day>27</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e12239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2019/2/e12239/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12239</pub-id>
          <pub-id pub-id-type="medline">31066697</pub-id>
          <pub-id pub-id-type="pii">v7i2e12239</pub-id>
          <pub-id pub-id-type="pmcid">PMC6528438</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jayatilleke</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kolliakou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gorrell</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing to extract symptoms of severe mental illness from clinical text: the Clinical Record Interactive Search Comprehensive Data Extraction (CRIS-CODE) project</article-title>
          <source>BMJ Open</source>
          <year>2017</year>
          <month>01</month>
          <day>17</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e012012</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=28096249"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-012012</pub-id>
          <pub-id pub-id-type="medline">28096249</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-012012</pub-id>
          <pub-id pub-id-type="pmcid">PMC5253558</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez-Sacristan</surname>
              <given-names>Alba</given-names>
            </name>
            <name name-style="western">
              <surname>Leis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>De La Peña</surname>
              <given-names>Santiago</given-names>
            </name>
            <name name-style="western">
              <surname>Sanz</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Furlong</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Using electronic health records to assess depression and cancer comorbidities</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2017</year>
          <volume>235</volume>
          <fpage>236</fpage>
          <lpage>240</lpage>
          <pub-id pub-id-type="doi">10.3233/978-1-61499-753-5-236</pub-id>
          <pub-id pub-id-type="medline">28423789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aerts</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>Carlos</given-names>
            </name>
            <name name-style="western">
              <surname>Ramírez-Anguita</surname>
              <given-names>Juan Manuel</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Gomez</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Durà-Hernández</surname>
              <given-names>Marta</given-names>
            </name>
            <name name-style="western">
              <surname>Thienpont</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Coorevits</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Quality of hospital electronic health record (EHR) data based on the International Consortium for Health Outcomes Measurement (ICHOM) in heart failure: pilot data quality assessment study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>08</month>
          <day>04</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e27842</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/8/e27842/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27842</pub-id>
          <pub-id pub-id-type="medline">34346902</pub-id>
          <pub-id pub-id-type="pii">v9i8e27842</pub-id>
          <pub-id pub-id-type="pmcid">PMC8374665</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>International Classification of Diseases, Ninth Revision, Clinical Modification (ICD-9-CM)</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2022-02-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchs/icd/icd9cm.htm">https://www.cdc.gov/nchs/icd/icd9cm.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agüero</surname>
              <given-names>Fernando</given-names>
            </name>
            <name name-style="western">
              <surname>Murta-Nascimento</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gallén</surname>
              <given-names>Manuel</given-names>
            </name>
            <name name-style="western">
              <surname>Andreu-García</surname>
              <given-names>Montserrat</given-names>
            </name>
            <name name-style="western">
              <surname>Pera</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hernández</surname>
              <given-names>Cristina</given-names>
            </name>
            <name name-style="western">
              <surname>Burón</surname>
              <given-names>Andrea</given-names>
            </name>
            <name name-style="western">
              <surname>Macià</surname>
              <given-names>Francesc</given-names>
            </name>
          </person-group>
          <article-title>Colorectal cancer survival: results from a hospital-based cancer registry</article-title>
          <source>Rev Esp Enferm Dig</source>
          <year>2012</year>
          <month>12</month>
          <volume>104</volume>
          <issue>11</issue>
          <fpage>572</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.grupoaran.com/mrmUpdate/lecturaPDFfromXML.asp?IdArt=4620427&#38;TO=RVN&#38;Eng=1"/>
          </comment>
          <pub-id pub-id-type="doi">10.4321/s1130-01082012001100004</pub-id>
          <pub-id pub-id-type="medline">23368648</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <article-title>SNOMED International SNOMED CT Browser</article-title>
          <source>SNOMED International</source>
          <access-date>2022-02-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://browser.ihtsdotools.org">https://browser.ihtsdotools.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Padró</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stanilovsky</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>FreeLing 3.0: Towards wider multilinguality</article-title>
          <source>Proceedings of the Eighth International Conference on Language Resources and Evaluation</source>
          <year>2012</year>
          <conf-name>LREC'12</conf-name>
          <conf-date>May 21-27, 2012</conf-date>
          <conf-loc>Istanbul, Turkey</conf-loc>
          <fpage>2473</fpage>
          <lpage>2479</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.lrec-conf.org/proceedings/lrec2012/pdf/430_Paper.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <source>Elasticsearch</source>
          <access-date>2022-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.elastic.co/">https://www.elastic.co/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaci</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Kormilitzin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>De Crescenzo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kurtulmus</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Dell</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Innocent</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tomlinson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cipriani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nevado-Holgado</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing for structuring clinical text data on depression using UK-CRIS</article-title>
          <source>Evid Based Ment Health</source>
          <year>2020</year>
          <month>02</month>
          <day>11</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>21</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1136/ebmental-2019-300134</pub-id>
          <pub-id pub-id-type="medline">32046989</pub-id>
          <pub-id pub-id-type="pii">ebmental-2019-300134</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koleck</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dreisbach</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bourne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bakken</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of symptoms documented in free-text narratives of electronic health records: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>04</month>
          <day>01</day>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>364</fpage>
          <lpage>379</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30726935"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy173</pub-id>
          <pub-id pub-id-type="medline">30726935</pub-id>
          <pub-id pub-id-type="pii">5307912</pub-id>
          <pub-id pub-id-type="pmcid">PMC6657282</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yim</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yetisgen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Kwan</surname>
              <given-names>SW</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing in oncology: a review</article-title>
          <source>JAMA Oncol</source>
          <year>2016</year>
          <month>06</month>
          <day>01</day>
          <volume>2</volume>
          <issue>6</issue>
          <fpage>797</fpage>
          <lpage>804</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaoncol.2016.0213</pub-id>
          <pub-id pub-id-type="medline">27124593</pub-id>
          <pub-id pub-id-type="pii">2517402</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menasalvas Ruiz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tuñas</surname>
              <given-names>Juan Manuel</given-names>
            </name>
            <name name-style="western">
              <surname>Bermejo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalo Martín</surname>
              <given-names>Consuelo</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez-González</surname>
              <given-names>Alejandro</given-names>
            </name>
            <name name-style="western">
              <surname>Zanin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>González de Pedro</surname>
              <given-names>Cristina</given-names>
            </name>
            <name name-style="western">
              <surname>Méndez</surname>
              <given-names>Marta</given-names>
            </name>
            <name name-style="western">
              <surname>Zaretskaia</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Parejo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz Bermudez</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Provencio</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Profiling lung cancer patients using electronic health records</article-title>
          <source>J Med Syst</source>
          <year>2018</year>
          <month>05</month>
          <day>31</day>
          <volume>42</volume>
          <issue>7</issue>
          <fpage>126</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-018-0975-9</pub-id>
          <pub-id pub-id-type="medline">29855732</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-018-0975-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spiranovic</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Scanlan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kirkby</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>Increasing knowledge of mental illness through secondary research of electronic health records: opportunities and challenges</article-title>
          <source>Adv Ment Health</source>
          <year>2015</year>
          <month>07</month>
          <day>21</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>14</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1080/18387357.2015.1063635</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>The use of electronic health records for psychiatric phenotyping and genomics</article-title>
          <source>Am J Med Genet B Neuropsychiatr Genet</source>
          <year>2018</year>
          <month>10</month>
          <day>30</day>
          <volume>177</volume>
          <issue>7</issue>
          <fpage>601</fpage>
          <lpage>612</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28557243"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ajmg.b.32548</pub-id>
          <pub-id pub-id-type="medline">28557243</pub-id>
          <pub-id pub-id-type="pmcid">PMC6440216</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
